Context Navigation

← Previous Changeset
Next Changeset →

Changeset 3008

Timestamp:

2002-02-27T11:55:28+13:00 (22 years ago)

Author:

jrm21

Message:

According to the c++ standard, we can't use a UCArray::iterator interchangeably
with char *, which caused errors with gcc3. We now get the address of the
character whenever we need to convert from iterator to char*.

Location:

trunk/gsdl/src/mgpp/text

Files:

: 10 edited

GSDLQueryLex.cpp (modified) (8 diffs)
Terms.cpp (modified) (1 diff)
UCArray.cpp (modified) (2 diffs)
UCArray.h (modified) (1 diff)
ivf.pass1.cpp (modified) (1 diff)
ivf.pass2.cpp (modified) (1 diff)
mgpp_perf_hash_build.cpp (modified) (1 diff)
mgpp_stem_idx.cpp (modified) (1 diff)
text.pass1.cpp (modified) (1 diff)
text.pass2.cpp (modified) (1 diff)

Legend:

: Unmodified
: Added
: Removed

trunk/gsdl/src/mgpp/text/GSDLQueryLex.cpp

-              r2693
+              r3008
   // this version of end is used in unitool
+  UCArray::const_iterator endMinus1 = end-1;
+  //  UCArray::const_iterator endMinus1 = end-1;
+  const unsigned char* endMinus1 = &(*end)-1;
   int charLen;
   unsigned short c; // one character lookahead
   charLen = parse_utf8_char (here, endMinus1, &c);
+  charLen = parse_utf8_char (&*here, endMinus1, &c);
   // check for positive or negative
 …
   if (c == '+') {
     AddNChar (here, el.text, charLen);
     charLen = parse_utf8_char (here, endMinus1, &c);
+    charLen = parse_utf8_char (&*here, endMinus1, &c);
   } else if (c == '-') {
     neg = true;
     AddNChar (here, el.text, charLen);
     charLen = parse_utf8_char (here, endMinus1, &c);
+    charLen = parse_utf8_char (&*here, endMinus1, &c);
+  }
 …
     el.num = el.num*10 + c - '0';
     AddNChar (here, el.text, charLen);
     charLen = parse_utf8_char (here, endMinus1, &c);
+    charLen = parse_utf8_char (&*here, endMinus1, &c);
+  }
 …
   // this version of end is used in unitool
+  UCArray::const_iterator endMinus1 = end-1;
+  //UCArray::const_iterator endMinus1 = end-1;
+  const unsigned char* endMinus1 = &(*end)-1;
   int charLen=0;
   int length=0;
   unsigned short c; // one character lookahead
   charLen = parse_utf8_char (here, endMinus1, &c);
+  charLen = parse_utf8_char (&*here, endMinus1, &c);
   // read in number part
 …
     AddNChar (here, el.text, charLen);
     length += charLen;
     charLen = parse_utf8_char (here, endMinus1, &c);
+    charLen = parse_utf8_char (&*here, endMinus1, &c);
+  }
   // check the next character -if it is a letter, then have a term, not an integer
 …
     AddNChar (here, el.text, charLen);
     length += charLen;
     charLen = parse_utf8_char (here, endMinus1, &c);
+    charLen = parse_utf8_char (&*here, endMinus1, &c);
+  }
 …
                UCArray::const_iterator end,
                UCArray &text) {
+  UCArray::const_iterator endMinus1 = end-1;
+  here = ParseIndexWord (here, endMinus1, text);
+  //UCArray::const_iterator endMinus1 = end-1;
+  const unsigned char* endMinus1 = &(*end)-1;
+  const unsigned char* new_here = ParseIndexWord (&*here, endMinus1, text);
+  here += (new_here - &*here); // advance iterator by number of chars advanced
   return !text.empty();
+}
 …
   // this version of end is used in unitool
+  UCArray::const_iterator endMinus1 = end-1;
+  //UCArray::const_iterator endMinus1 = end-1;
+  const unsigned char* endMinus1 = &(*end)-1;
   // ignore all white space
   int charLen;
   unsigned short c; // one character lookahead
   charLen = parse_utf8_char (here, endMinus1, &c);
+  charLen = parse_utf8_char (&*here, endMinus1, &c);
   while (here != end && is_unicode_space (c)) {
     here += charLen;
     charLen = parse_utf8_char (here, endMinus1, &c);
+    charLen = parse_utf8_char (&*here, endMinus1, &c);
+  }
   if (here == end) return false;

trunk/gsdl/src/mgpp/text/Terms.cpp

r2468	r3008
244	244	// convert the word to an "mg word"
245	245	mgWord[0] = term.size();
246		memcpy ((char *)&mgWord[1], ~~(const char *)term.begin(~~), term.size());
	246	memcpy ((char *)&mgWord[1], &(term[0]), term.size());
247	247
248	248	// stem the word

trunk/gsdl/src/mgpp/text/UCArray.cpp

-              r2468
+              r3008
   int i = 0;
   while (here != end) {
     cstr[i] = (char)*here;
+    cstr[i] = text[i];
     here++; i++;
+  }
 …
   fputc (sufLen, f);
   if (ferror(f) != 0) return false;
+  return (fwrite ((char *)a.begin()+preLen, sizeof (char), sufLen, f) == sufLen);
+  char* tmp=GetCStr(a);
+  int ret=(fwrite (tmp+preLen, sizeof (char), sufLen, f) == sufLen);
+  delete (tmp);
+  return (ret);
+}

trunk/gsdl/src/mgpp/text/UCArray.h

r2468	r3008
24	24
25	25	// need this to avoid bizarre compiler problems under VC++ 6.0
26		#if ~~defined (__WIN32__~~) && !defined (GSDL_USE_IOS_H)
	26	#if !defined (GSDL_NAMESPACE_BROKEN) && !defined (GSDL_USE_IOS_H)
27	27	# include <iostream>
28	28	using namespace std;

trunk/gsdl/src/mgpp/text/ivf.pass1.cpp

-              r2468
+              r3008
   if (!wordLevelIndex && !inFrag) return;
   const unsigned char *textHere = el.text.begin();
   const unsigned char *textEnd = el.text.end() - 1;
+  const unsigned char *textHere = &(el.text[0]);
+  const unsigned char *textEnd = &(el.text[el.text.size() - 1]);
   UCArray word;

trunk/gsdl/src/mgpp/text/ivf.pass2.cpp

-              r2468
+              r3008
   if (!wordLevelIndex && !inFrag) return;
   const unsigned char *textHere = el.text.begin();
   const unsigned char *textEnd = el.text.end() - 1;
+  const unsigned char *textHere = &(el.text[0]);
+  const unsigned char *textEnd = &(el.text[el.text.size() - 1]);
   unsigned char mgWord[MAXSTEMLEN + 1];

trunk/gsdl/src/mgpp/text/mgpp_perf_hash_build.cpp

r2557	r3008
93	93
94	94	*pool++ = wordEl.el.size();
95		memcpy ((char *) pool, ~~(const char *) wordEl.el.begin(~~), wordEl.el.size());
	95	memcpy ((char *) pool, &(wordEl.el[0]), wordEl.el.size());
96	96	//cerr << pool<<" " <<starts[i]<<endl;
97	97	pool += wordEl.el.size();

trunk/gsdl/src/mgpp/text/mgpp_stem_idx.cpp

r2557	r3008
76	76	// convert the word to an "mg word"
77	77	mgWord[0] = wordEl.el.size();
78		memcpy((char *)&mgWord[1], ~~(const char *)wordEl.el.begin(~~), wordEl.el.size());
	78	memcpy((char *)&mgWord[1], &(wordEl.el[0]), wordEl.el.size());
79	79
80	80	// stem the word

trunk/gsdl/src/mgpp/text/text.pass1.cpp

r2698	r3008
269	269	docLen += textLen;
270	270
271		retValue = process_text_element (~~(*here).text.begin(~~), textLen);
	271	retValue = process_text_element (&(here->text[0]), textLen);
272	272	if (retValue != COMPALLOK) return retValue;
273	273

trunk/gsdl/src/mgpp/text/text.pass2.cpp

r2541	r3008
384	384	// compress the text
385	385	if (compress_text (textOutBuf,
386		~~(*here).text.begin(~~),
	386	&(here->text[0]),
387	387	(*here).text.size(),
388	388	whichWordType,

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changeset 3008

Legend:

Download in other formats: