2
2
* dictionary.c
3
3
*
4
4
* Copyright (C) 2003 Nadav Rotem <[email protected] >
5
- *
5
+ *
6
6
* This program is free software; you can redistribute it and/or modify
7
7
* it under the terms of the GNU General Public License as published by
8
8
* the Free Software Foundation; either version 2 of the License, or
@@ -40,28 +40,28 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
40
40
xmlNodePtr stem = NULL ;
41
41
xmlNodePtr pre = NULL ;
42
42
xmlNodePtr post = NULL ;
43
- xmlNodePtr syno = NULL ; /* synonyms */
44
- xmlNodePtr manual = NULL ; /* manual */
45
- xmlNodePtr step1_pre = NULL ; /* step1 */
46
- xmlNodePtr step1_post = NULL ; /* step1 */
47
-
48
- xmlNodePtr parse = NULL ; /* parser rules */
49
- xmlNodePtr pbreak = NULL ;
50
- xmlNodePtr pdbreak = NULL ;
51
-
52
- xmlNodePtr tc_words = NULL ; /* term count dictionary */
53
- xmlNodePtr tf_words = NULL ; /* term frequency dictionary */
54
-
43
+ xmlNodePtr syno = NULL ; /* synonyms */
44
+ xmlNodePtr manual = NULL ; /* manual */
45
+ xmlNodePtr step1_pre = NULL ; /* step1 */
46
+ xmlNodePtr step1_post = NULL ; /* step1 */
47
+
48
+ xmlNodePtr parse = NULL ; /* parser rules */
49
+ xmlNodePtr pbreak = NULL ;
50
+ xmlNodePtr pdbreak = NULL ;
51
+
52
+ xmlNodePtr tc_words = NULL ; /* term count dictionary */
53
+ xmlNodePtr tf_words = NULL ; /* term frequency dictionary */
54
+
55
55
56
56
OtsStemRule * rule = Doc -> stem ;
57
-
57
+
58
58
char * local_dict_name ;
59
-
59
+
60
60
local_dict_name = g_strdup_printf ("%s.xml" , name );
61
61
62
62
63
- if (g_file_test (local_dict_name ,G_FILE_TEST_EXISTS ))
64
- doc = xmlParseFile (local_dict_name ); /* it warns to the screen so we cant use it; enable for web services only */
63
+ if (g_file_test (local_dict_name ,G_FILE_TEST_EXISTS ))
64
+ doc = xmlParseFile (local_dict_name ); /* it warns to the screen so we cant use it; enable for web services only */
65
65
if (doc == NULL ) return (FALSE);
66
66
67
67
head = xmlDocGetRootElement (doc );
@@ -82,23 +82,23 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
82
82
if (head != NULL )
83
83
stem = head -> xmlChildrenNode ;
84
84
while ((stem != NULL )
85
- && (xmlStrcmp (stem -> name , (const xmlChar * ) "stemmer" )))
85
+ && (xmlStrcmp (stem -> name , (const xmlChar * ) "stemmer" )))
86
86
{
87
87
stem = stem -> next ;
88
88
}
89
89
90
90
if (head != NULL )
91
91
parse = head -> xmlChildrenNode ;
92
92
while ((parse != NULL )
93
- && (xmlStrcmp (parse -> name , (const xmlChar * ) "parser" )))
93
+ && (xmlStrcmp (parse -> name , (const xmlChar * ) "parser" )))
94
94
{
95
95
parse = parse -> next ;
96
96
}
97
97
98
98
if (head != NULL )
99
99
tc_words = head -> xmlChildrenNode ;
100
100
while ((tc_words != NULL )
101
- && (xmlStrcmp (tc_words -> name , (const xmlChar * ) "grader-tc" )))
101
+ && (xmlStrcmp (tc_words -> name , (const xmlChar * ) "grader-tc" )))
102
102
{
103
103
tc_words = tc_words -> next ;
104
104
}
@@ -107,12 +107,12 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
107
107
if (head != NULL )
108
108
tf_words = head -> xmlChildrenNode ;
109
109
while ((tf_words != NULL )
110
- && (xmlStrcmp (tf_words -> name , (const xmlChar * ) "grader-tf" )))
110
+ && (xmlStrcmp (tf_words -> name , (const xmlChar * ) "grader-tf" )))
111
111
{
112
112
tf_words = tf_words -> next ;
113
113
}
114
-
115
-
114
+
115
+
116
116
117
117
if (stem != NULL )
118
118
pre = stem -> xmlChildrenNode ;
@@ -132,15 +132,15 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
132
132
if (stem != NULL )
133
133
syno = stem -> xmlChildrenNode ;
134
134
while ((syno != NULL )
135
- && (xmlStrcmp (syno -> name , (const xmlChar * ) "synonyms" )))
135
+ && (xmlStrcmp (syno -> name , (const xmlChar * ) "synonyms" )))
136
136
{
137
137
syno = syno -> next ;
138
138
}
139
139
140
140
if (stem != NULL )
141
141
manual = stem -> xmlChildrenNode ;
142
142
while ((manual != NULL )
143
- && (xmlStrcmp (manual -> name , (const xmlChar * ) "manual" )))
143
+ && (xmlStrcmp (manual -> name , (const xmlChar * ) "manual" )))
144
144
{
145
145
manual = manual -> next ;
146
146
}
@@ -149,31 +149,31 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
149
149
if (stem != NULL )
150
150
step1_pre = stem -> xmlChildrenNode ;
151
151
while ((step1_pre != NULL )
152
- && (xmlStrcmp (step1_pre -> name , (const xmlChar * ) "step1_pre" )))
152
+ && (xmlStrcmp (step1_pre -> name , (const xmlChar * ) "step1_pre" )))
153
153
{
154
154
step1_pre = step1_pre -> next ;
155
155
}
156
-
157
-
158
-
156
+
157
+
158
+
159
159
if (stem != NULL )
160
160
step1_post = stem -> xmlChildrenNode ;
161
161
while ((step1_post != NULL )
162
- && (xmlStrcmp (step1_post -> name , (const xmlChar * ) "step1_post" )))
162
+ && (xmlStrcmp (step1_post -> name , (const xmlChar * ) "step1_post" )))
163
163
{
164
164
step1_post = step1_post -> next ;
165
165
}
166
166
167
167
168
168
if (pre != NULL )
169
- pre = pre -> xmlChildrenNode ; /*point to first word */
169
+ pre = pre -> xmlChildrenNode ; /*point to first word */
170
170
while (pre != NULL )
171
171
{
172
172
if (0 == xmlStrcmp (pre -> name , (const xmlChar * ) "rule" ))
173
- rule -> RemovePre =
174
- g_list_append (rule -> RemovePre ,
175
- (xmlNodeListGetString
176
- (doc , pre -> xmlChildrenNode , 1 )));
173
+ rule -> RemovePre =
174
+ g_list_append (rule -> RemovePre ,
175
+ (xmlNodeListGetString
176
+ (doc , pre -> xmlChildrenNode , 1 )));
177
177
pre = pre -> next ;
178
178
}
179
179
@@ -183,10 +183,10 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
183
183
while (post != NULL )
184
184
{
185
185
if (0 == xmlStrcmp (post -> name , (const xmlChar * ) "rule" ))
186
- rule -> RemovePost =
187
- g_list_append (rule -> RemovePost ,
188
- (xmlNodeListGetString
189
- (doc , post -> xmlChildrenNode , 1 )));
186
+ rule -> RemovePost =
187
+ g_list_append (rule -> RemovePost ,
188
+ (xmlNodeListGetString
189
+ (doc , post -> xmlChildrenNode , 1 )));
190
190
post = post -> next ;
191
191
}
192
192
@@ -195,10 +195,10 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
195
195
while (syno != NULL )
196
196
{
197
197
if (0 == xmlStrcmp (syno -> name , (const xmlChar * ) "rule" ))
198
- rule -> synonyms =
199
- g_list_append (rule -> synonyms ,
200
- (xmlNodeListGetString
201
- (doc , syno -> xmlChildrenNode , 1 )));
198
+ rule -> synonyms =
199
+ g_list_append (rule -> synonyms ,
200
+ (xmlNodeListGetString
201
+ (doc , syno -> xmlChildrenNode , 1 )));
202
202
syno = syno -> next ;
203
203
}
204
204
@@ -207,10 +207,10 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
207
207
while (manual != NULL )
208
208
{
209
209
if (0 == xmlStrcmp (manual -> name , (const xmlChar * ) "rule" ))
210
- rule -> manual =
211
- g_list_append (rule -> manual ,
212
- (xmlNodeListGetString
213
- (doc , manual -> xmlChildrenNode , 1 )));
210
+ rule -> manual =
211
+ g_list_append (rule -> manual ,
212
+ (xmlNodeListGetString
213
+ (doc , manual -> xmlChildrenNode , 1 )));
214
214
manual = manual -> next ;
215
215
}
216
216
@@ -222,10 +222,10 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
222
222
while (step1_pre != NULL )
223
223
{
224
224
if (0 == xmlStrcmp (step1_pre -> name , (const xmlChar * ) "rule" ))
225
- rule -> step1_pre =
226
- g_list_append (rule -> step1_pre ,
227
- (xmlNodeListGetString
228
- (doc , step1_pre -> xmlChildrenNode , 1 )));
225
+ rule -> step1_pre =
226
+ g_list_append (rule -> step1_pre ,
227
+ (xmlNodeListGetString
228
+ (doc , step1_pre -> xmlChildrenNode , 1 )));
229
229
step1_pre = step1_pre -> next ;
230
230
}
231
231
@@ -236,10 +236,10 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
236
236
while (step1_post != NULL )
237
237
{
238
238
if (0 == xmlStrcmp (step1_post -> name , (const xmlChar * ) "rule" ))
239
- rule -> step1_post =
240
- g_list_append (rule -> step1_post ,
241
- (xmlNodeListGetString
242
- (doc , step1_post -> xmlChildrenNode , 1 )));
239
+ rule -> step1_post =
240
+ g_list_append (rule -> step1_post ,
241
+ (xmlNodeListGetString
242
+ (doc , step1_post -> xmlChildrenNode , 1 )));
243
243
step1_post = step1_post -> next ;
244
244
}
245
245
@@ -258,18 +258,18 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
258
258
{
259
259
pdbreak = pdbreak -> next ;
260
260
}
261
-
262
-
261
+
262
+
263
263
/*Parser break*/
264
264
if (pbreak != NULL )
265
265
pbreak = pbreak -> xmlChildrenNode ;
266
266
while (pbreak != NULL )
267
267
{
268
268
if (0 == xmlStrcmp (pbreak -> name , (const xmlChar * ) "rule" ))
269
- rule -> ParserBreak =
270
- g_list_append (rule -> ParserBreak ,
271
- (xmlNodeListGetString
272
- (doc , pbreak -> xmlChildrenNode , 1 )));
269
+ rule -> ParserBreak =
270
+ g_list_append (rule -> ParserBreak ,
271
+ (xmlNodeListGetString
272
+ (doc , pbreak -> xmlChildrenNode , 1 )));
273
273
pbreak = pbreak -> next ;
274
274
}
275
275
@@ -279,10 +279,10 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
279
279
while (pdbreak != NULL )
280
280
{
281
281
if (0 == xmlStrcmp (pdbreak -> name , (const xmlChar * ) "rule" ))
282
- rule -> ParserDontBreak =
283
- g_list_append (rule -> ParserDontBreak ,
284
- (xmlNodeListGetString
285
- (doc , pdbreak -> xmlChildrenNode , 1 )));
282
+ rule -> ParserDontBreak =
283
+ g_list_append (rule -> ParserDontBreak ,
284
+ (xmlNodeListGetString
285
+ (doc , pdbreak -> xmlChildrenNode , 1 )));
286
286
pdbreak = pdbreak -> next ;
287
287
}
288
288
@@ -293,37 +293,37 @@ ots_load_xml_dictionary (OtsArticle * Doc,unsigned const char *name)
293
293
while (tc_words != NULL )
294
294
{
295
295
if (0 == xmlStrcmp (tc_words -> name , (const xmlChar * ) "word" ))
296
- {
297
- xmlChar * key ;
298
- key = xmlNodeListGetString (doc , tc_words -> xmlChildrenNode ,1 );
299
- Doc -> dict = g_list_append (Doc -> dict ,(gpointer )ots_new_wordEntery (key ));
296
+ {
297
+ xmlChar * key ;
298
+ key = xmlNodeListGetString (doc , tc_words -> xmlChildrenNode ,1 );
299
+ Doc -> dict = g_list_append (Doc -> dict ,(gpointer )ots_new_wordEntery (key ));
300
300
xmlFree (key );
301
301
}
302
302
tc_words = tc_words -> next ;
303
303
}
304
-
305
-
304
+
305
+
306
306
/*Term Frequency load dict*/
307
-
307
+
308
308
if (tf_words != NULL )
309
309
tf_words = tf_words -> xmlChildrenNode ;
310
310
while (tf_words != NULL )
311
311
{
312
312
if (0 == xmlStrcmp (tf_words -> name , (const xmlChar * ) "word" ))
313
- {
314
- xmlChar * key ;
315
- xmlChar * idf_key ;
316
- key = xmlNodeListGetString (doc , tf_words -> xmlChildrenNode ,1 );
317
-
318
- idf_key = xmlGetProp (tf_words ,"idf" );
319
- Doc -> tf_terms = g_list_append (Doc -> tf_terms ,ots_new_OtsWordTF (key ,atof (idf_key )));
313
+ {
314
+ xmlChar * key ;
315
+ xmlChar * idf_key ;
316
+ key = xmlNodeListGetString (doc , tf_words -> xmlChildrenNode ,1 );
317
+
318
+ idf_key = xmlGetProp (tf_words ,"idf" );
319
+ Doc -> tf_terms = g_list_append (Doc -> tf_terms ,ots_new_OtsWordTF (key ,atof (idf_key )));
320
320
xmlFree (key );
321
321
xmlFree (idf_key );
322
322
}
323
323
tf_words = tf_words -> next ;
324
324
}
325
-
326
-
325
+
326
+
327
327
xmlFreeDoc (doc );
328
328
xmlCleanupParser ();
329
329
g_free (local_dict_name );
0 commit comments