数据库

本类阅读TOP10

·SQL语句导入导出大全
·SQL Server日期计算
·SQL语句导入导出大全
·SQL to Excel 的应用
·Oracle中password file的作用及说明
·MS SQLServer OLEDB分布式事务无法启动的一般解决方案
·sqlserver2000数据库置疑的解决方法
·一个比较实用的大数据量分页存储过程
·如何在正运行 SQL Server 7.0 的服务器之间传输登录和密码
·SQL中两台服务器间使用连接服务器

分类导航
VC语言 Delphi
VB语言 ASP
Perl Java
Script 数据库
其他语言 游戏开发
文件格式 网站制作
软件工程 .NET开发
如何将全文检索中的“干扰词”去除

作者:未知 来源:月光软件站 加入时间:2005-2-28 月光软件站

在页面中包含以下脚本,然后调用 remove_noise_word() 即可:

 

<SCRIPT LANGUAGE=javascript>
<!--
  noise_word_list_ch = new Array("?","about","$","1","2","3","4","5","6","7","8","9","0","_",
        "a","b","c","d","e","f","g","h","i","j","k","l","m","n","o",
        "p","q","r","s","t","u","v","w","x","y","z","after","all","also",
        "an","and","another","any","are","as","at","be","because","been",
        "before","being","between","both","but","by","came","can","come",
        "could","did","do","each","for","from","get","got","had","has",
        "have","he","her","here","him","himself","his","how","if","in","into",
        "is","it","like","make","many","me","might","more","most","much","must",
        "my","never","now","of","on","only","or","other","our","out","over","said",
        "same","see","should","since","some","still","such","take","than","that",
        "the","their","them","then","there","these","they","this","those","through",
        "to","too","under","up","very","was","way","we","well","were","what","where",
        "which","while","who","with","would","you","your",
        "的","一","不","在","人","有","是","为","以","于","上","他","而","后","之","来",
        "及","了","因","下","可","到","由","这","与","也","此","但","并","个","其","已",
         "无","小","我","们","起","最","再","今","去","好","只","又","或","很","亦","某",
        "把","那","你","乃","它");

// Returns inputVal converted to a string with all leading and trailing
// space characters removed.
//
// Only the plain space (U+0020) is stripped; tabs, newlines and other
// whitespace are left untouched. Interior spaces are preserved.
//
// inputVal: any value; it is converted with toString(). null and undefined
//           (which have no toString method) are treated as an empty string.
// Returns:  the trimmed string.
function trim_str_key(inputVal){
  if (inputVal === null || inputVal === undefined){
    return "";
  }
  // Local variable: the working string must not leak into the global scope.
  var text = inputVal.toString();
  // One anchored pass removes the run of spaces at each end.
  return text.replace(/^ +| +$/g, "");
}

// Reports whether str_key is a noise word.
//
// The candidate is trimmed with trim_str_key() and lower-cased, then compared
// for exact equality against every entry of noise_word_list_ch.
//
// str_key: the keyword to test.
// Returns: true when the normalised keyword is in the list, false otherwise
//          (an empty keyword is not in the list, so it yields false).
function is_ch_noise_word(str_key){
   var key_word = trim_str_key(str_key).toLowerCase();
   var listlength = noise_word_list_ch.length;
   var i; // declared locally so the loop counter does not become a global
   for (i = 0; i < listlength; i++){
      if (noise_word_list_ch[i] === key_word){
         return true;
      }
   }
   return false;
}

// Removes noise words from a space-separated keyword string.
//
// The input is trimmed with trim_str_key() and split on single spaces. Every
// token is checked with is_ch_noise_word(), including the last one, and the
// surviving tokens are joined with exactly one space. Empty tokens, which
// arise from runs of consecutive spaces, are dropped so the result never
// contains doubled spaces.
//
// str_source: the raw keyword string.
// Returns:    the filtered keyword string; "" when the input is empty or
//             every token is a noise word.
function remove_noise_word(str_source){
  var words = trim_str_key(str_source).split(" ");
  var kept = [];
  var word;
  var i;

  for (i = 0; i < words.length; i++){
    word = words[i];
    // Skip the empty tokens produced by consecutive spaces.
    if (word === ""){
      continue;
    }
    if (!is_ch_noise_word(word)){
      kept.push(word);
    }
  }
  return kept.join(" ");
}

//下面是一个测试
//var abc = "av  n";
//var nnnn = remove_noise_word(abc);
//alert(nnnn);
//-->
</SCRIPT>




相关文章

相关软件