类文件wordsplit.class.php:
<?php
/********************************************************************
* DirCMS中文分词类 beta 1.0
* ---------------------------
* begin : 2010-5-11 beta 1.0
* update : 2010-5-11 beta 1.0
* copyright : (C) 2009 DirCMS
* email : uuturn@126.com
* author : 穆红伟 M QQ:251171960
* algorithm : 反向最大匹配算法 【注意:本文件需保存为UTF-8格式】
*
* $Id: wordsplit.class.php,v 1.0.0 2010-5-11 9:14:01 M Exp $
********************************************************************/
class wordsplit
{
public $dicloadtime; // time taken to load the dictionary
public $splitwordstime; // time taken by word segmentation
private $starttime; // segmentation start time
private $splitchar=' '; // delimiter placed between words, defaults to a space
private $wordsdic=array(); // dictionary: array keyed by word with the word frequency as value; the frequency is not used by this segmenter yet
// Described by the original author as Chinese full-width letters and digits.
// NOTE(review): the literal as it appears here holds only ASCII (half-width)
// characters; presumably the full-width forms were lost when the file was
// re-encoded or normalized -- confirm against the original UTF-8 file.
private $cnnumber='0|1|2|3|4|5|6|7|8|9|+|-|%|.|a|b|c|d|e|f|g|h|i|j|k|l|m|n|o|p|q|r|s|t|u|v|w|x|y|z|A|B|C|D|E|F|G|H|I|J|K|L|M|N|O|P|Q|R|S|T|U|V|W|X|Y|Z'; // 中文全角字母,数字
// Punctuation marks recognised by the segmenter.
// NOTE(review): the first three entries (backslash-r, backslash-n, backslash-t)
// are single-quoted, and PHP does not expand those escapes in single-quoted
// strings, so they are two-character literals rather than CR, LF and TAB --
// confirm whether control characters were intended.
// NOTE(review): in the second half of the list there is an entry made of a lone
// backslash between single quotes. In a single-quoted string a backslash
// followed by a quote is an escaped quote, so that entry does not terminate and
// every quote after it is unbalanced. The second half also repeats the ASCII
// marks of the first half, so it presumably held full-width punctuation
// (including a full-width backslash) before normalization -- restore from the
// original file before using this class.
private $punctuation= array('\r','\n','\t','`','~','!','@','#','$','%','^','&','*','(',')','-','_','+','=','|','\\','\'','"',';',':','/','?','.','>',',','<','[','{',']','}','·','~','!','@','#','¥','%','……','&','×','(',')','-','——','=','+','\','|','【','{','】','}','‘','“','”',';',':','、','?','。','》',',','《',' ',' '); // 标点符号
private $trimchars=array("▲","△","▼","▽","★","☆","◆","◇","■","□","●","○","⊙","㊣","◎","▂","▁","▃","▄","▅","▆","▇","█","▏","▎","▍","▌","▋","▊","◢","◣","◥","◤","▲","▼","♀","♂","卍","※");
private $resultstr=array(); //分词结果字
使用GyPSii API提供的操作类和方法发送请求时,请求总是失败,返回的是一个bad request。原因其实很简单,但一直没有找到,最终发现是对方提供的host是错误的,没天理。
对方提供的host和uri:
host:http://dev3.gypsii.com/gypsii
uri:http://dev3.gypsii.com/gypsii/xmlservice.cgi
这个host就是错的,应该是:dev3.gypsii.co ......