ChatScript
diff --git a/‎SRC/english.cpp
Lines changed: 5 additions & 2 deletions b/‎SRC/english.cpp
Lines changed: 5 additions & 2 deletions
diff --git a/‎SRC/englishTagger.cpp
Lines changed: 20 additions & 19 deletions b/‎SRC/englishTagger.cpp
Lines changed: 20 additions & 19 deletions
diff --git a/‎SRC/functionExecute.cpp
Lines changed: 1 addition & 1 deletion b/‎SRC/functionExecute.cpp
Lines changed: 1 addition & 1 deletion
diff --git a/‎SRC/mainSystem.cpp
Lines changed: 1 addition & 1 deletion b/‎SRC/mainSystem.cpp
Lines changed: 1 addition & 1 deletion
diff --git a/‎SRC/scriptCompile.cpp
Lines changed: 3 additions & 3 deletions b/‎SRC/scriptCompile.cpp
Lines changed: 3 additions & 3 deletions
diff --git a/‎SRC/topicSystem.cpp
Lines changed: 1 addition & 1 deletion b/‎SRC/topicSystem.cpp
Lines changed: 1 addition & 1 deletion
diff --git a/‎WIKI/ChatScript-System-Variables-and-Engine-defined-Concepts.md
Lines changed: 1 addition & 0 deletions b/‎WIKI/ChatScript-System-Variables-and-Engine-defined-Concepts.md
Lines changed: 1 addition & 0 deletions
diff --git a/‎WIKI/ESOTERIC-CHATSCRIPT/ChatScript-PosParser.md
Lines changed: 1 addition & 1 deletion b/‎WIKI/ESOTERIC-CHATSCRIPT/ChatScript-PosParser.md
Lines changed: 1 addition & 1 deletion
@@ -696,7 +696,10 @@ uint64 GetPosData( int at, char* original,WORDP& revise, WORDP &entry,WORDP &can
 { // this is not allowed to write properties/systemflags/internalbits if the word is preexisting
 	uint64 properties = 0;
 	sysflags = cansysflags = 0;
-	canonical = 0;
+	canonical = 0;  
+	if (at < 1) { ; } // not from sentence
+	else if (canonicalLower[at]) canonical = canonicalLower[at];  // note canonicalLower may already be set by external postagging
+	else if (canonicalUpper[at]) canonical = canonicalUpper[at];  // note canonicalUpper may already be set by external postagging
 	entry = 0;
 	if (start == 0) start = 1;
 	if (revise) revise = NULL;
@@ -970,7 +973,7 @@ uint64 GetPosData( int at, char* original,WORDP& revise, WORDP &entry,WORDP &can
 			if (participle && !strcmp(participle,original)) properties |= NOUN_ADJECTIVE;
 		}
 		WORDP canon = GetCanonical(entry);
-		if (canon) canonical = canon;
+		if (canon && !canonical) canonical = canon;
 		if (canonical) cansysflags = canonical->systemFlags;
 
 		// german postag data marks all nouns without separating singular from plural
 
@@ -720,6 +720,7 @@ static void SetCanonicalValue(int start,int end)
 		else ++lower;
 	}
 	bool caseSignificant = (lower > 3 && lower > upper);
+	bool csEnglish = !stricmp(language, "english");
 
 	// now set canonical lowercase forms
 	for (int i = start; i <= end; ++i)
@@ -734,7 +735,8 @@ static void SetCanonicalValue(int start,int end)
 		WORDP D = FindWord(original);
 		WORDP canon1 = (D) ? GetCanonical(D) : NULL;
 		char* canon =  (canon1) ? canon1->word : NULL;
-		if (posValues[i] & (DETERMINER| IDIOM) && original[1] == 0)  // treat "a" as not a letter A
+
+		if (csEnglish && posValues[i] & (DETERMINER| IDIOM) && original[1] == 0)  // treat "a" as not a letter A
 		{
 			canon = NULL;
 			canonicalLower[i] = originalLower[i];
@@ -746,7 +748,7 @@ static void SetCanonicalValue(int start,int end)
 			canonicalLower[i] = originalLower[i];
 			continue;
 		}
-		else if (allOriginalWordBits[i] & CONJUNCTION )
+		else if (csEnglish && allOriginalWordBits[i] & CONJUNCTION )
 		{
 			if (!stricmp(wordStarts[i], "times")) // a conjunction looking like plural that in singular is a normal word
 			{
@@ -757,19 +759,19 @@ static void SetCanonicalValue(int start,int end)
 		}
 
 		// a word like "won" has noun, verb, adjective meanings. We prefer a canonical that's different from the original
-		if (canon && IsUpperCase(*canon)) canonicalUpper[i] = FindWord(canon);
-		else if (canon) canonicalLower[i] = FindWord(canon);
+		if (csEnglish && canon && IsUpperCase(*canon)) canonicalUpper[i] = FindWord(canon);
+		else if (csEnglish && canon) canonicalLower[i] = FindWord(canon);
 		else if (pos & NUMBER_BITS); // must occur before verbs and nouns, since "second" is a verb and a noun
 		else if (canonicalLower[i] && canonicalLower[i]->properties & (NOUN_NUMBER|ADJECTIVE_NUMBER)); // dont change canonical numbers like December second
-		else if (allOriginalWordBits[i] & NOUN_GERUND) // because singing is a dict word, we might prefer noun over gerund. We shouldned
+		else if (csEnglish && allOriginalWordBits[i] & NOUN_GERUND) // because singing is a dict word, we might prefer noun over gerund. We shouldned
 		{
 			canonicalLower[i] = FindWord(GetInfinitive(original,false));
 		}
-		else if (pos & (VERB_BITS | NOUN_GERUND | NOUN_INFINITIVE|ADJECTIVE_PARTICIPLE) ) 
+		else if (csEnglish && pos & (VERB_BITS | NOUN_GERUND | NOUN_INFINITIVE|ADJECTIVE_PARTICIPLE) )
 		{
 			canonicalLower[i] = FindWord(GetInfinitive(original,false));
 		}
-		else if (pos & ADJECTIVE_NORMAL && !(D && D->properties & (MORE_FORM|MOST_FORM)))
+		else if (csEnglish && pos & ADJECTIVE_NORMAL && !(D && D->properties & (MORE_FORM|MOST_FORM)))
 		{
 			canonicalLower[i] = originalLower[i]; // "his *fixed view should be adjective and not participle given it is an adjective- arbitrary
 			if (allOriginalWordBits[i] & ADJECTIVE_PARTICIPLE) 
@@ -778,7 +780,7 @@ static void SetCanonicalValue(int start,int end)
 				if (verb) canonicalLower[i] = FindWord(verb);
 			}
 		}
-		else if (pos & (NOUN_BITS - NOUN_GERUND - NOUN_ADJECTIVE)  || (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original))) 
+		else if (csEnglish && pos & (NOUN_BITS - NOUN_GERUND - NOUN_ADJECTIVE)  || (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original)))
 		{
 			if (pos & (NOUN_PROPER_SINGULAR|NOUN_PROPER_PLURAL) && canonicalUpper[i] && canonicalUpper[i]->properties & NOUN) // can it be upper case interpretation?
 			{
@@ -793,17 +795,17 @@ static void SetCanonicalValue(int start,int end)
 			}
 			if (canonicalLower[i] && canonicalLower[i]->properties & (DETERMINER|NUMBER_BITS));
 			else if (IsAlphaUTF8(*original) &&  canonicalLower[i] && !strcmp(canonicalLower[i]->word,(char*)"unknown-word"));	// keep unknown-ness
- 			else if (pos & NOUN_BITS && !canonicalUpper[i]) 
+ 			else if (csEnglish && pos & NOUN_BITS && !canonicalUpper[i])
 			{
 				char* noun = GetSingularNoun(original,false,true);
 				if (noun) canonicalLower[i] = FindWord(noun);
 			}
-			else if (D && D->internalBits & UPPERCASE_HASH && FindWord(original, 0,LOWERCASE_LOOKUP))
+			else if (csEnglish && D && D->internalBits & UPPERCASE_HASH && FindWord(original, 0,LOWERCASE_LOOKUP))
 			{
 				canonicalLower[i] = FindWord(original,0, LOWERCASE_LOOKUP);
 			}
 		}
-		else if (pos & (ADJECTIVE_BITS - ADJECTIVE_PARTICIPLE - ADJECTIVE_NOUN) || (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original))) 
+		else if (csEnglish && pos & (ADJECTIVE_BITS - ADJECTIVE_PARTICIPLE - ADJECTIVE_NOUN) || (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original)))
 		{
 			if (canonicalLower[i] && canonicalLower[i]->properties & NUMBER_BITS);
 			else 
@@ -813,13 +815,13 @@ static void SetCanonicalValue(int start,int end)
 			}
 
 			// for adjectives that are verbs, like married, go canonical to the verb if adjective is unchanged
-			if (canonicalLower[i] && !strcmp(canonicalLower[i]->word,original))
+			if (csEnglish && canonicalLower[i] && !strcmp(canonicalLower[i]->word,original))
 			{
 				char* infinitive = GetInfinitive(original,false);
 				if (infinitive) canonicalLower[i] = FindWord(infinitive);
 			}
 		}
-		else if (pos & ADJECTIVE_NOUN) 
+		else if (csEnglish && pos & ADJECTIVE_NOUN)
 		{
 			if (canonicalLower[i] && canonicalLower[i]->properties & NUMBER_BITS);
 			else if (IsUpperCase(*wordStarts[i]) && caseSignificant) {;}  //  upper case is intentional
@@ -829,7 +831,7 @@ static void SetCanonicalValue(int start,int end)
 				if (adj) canonicalLower[i] = FindWord(adj);
 			}
 		}
-		else if (pos & ADVERB || (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original))) 
+		else if (csEnglish && pos & ADVERB || (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original)))
 		{
 			if (canonicalLower[i] && canonicalLower[i]->properties & NUMBER_BITS);
 			else canonicalLower[i] = FindWord(GetAdverbBase(original,false));
@@ -844,14 +846,14 @@ static void SetCanonicalValue(int start,int end)
 		else if (*original == '~') canonicalLower[i] = FindWord(original);
 		else if (!IsAlphaUTF8(*original)) canonicalLower[i] = FindWord(original);
 
-		if (pos & PRONOUN_BITS && !stricmp(original,(char*)"one")) // make it a number
+		if (csEnglish && pos & PRONOUN_BITS && !stricmp(original,(char*)"one")) // make it a number
 		{
 			canonicalLower[i] = StoreWord((char*)"1",NOUN|NOUN_NUMBER);
 		}
 
 		// handle composite verb canonical for single hypen case
 		char* hyphen = strchr(original,'-');
-		if (hyphen && pos & (VERB_BITS|NOUN_GERUND|ADJECTIVE_PARTICIPLE|NOUN_INFINITIVE)) // find the verb root.
+		if (csEnglish && hyphen && pos & (VERB_BITS|NOUN_GERUND|ADJECTIVE_PARTICIPLE|NOUN_INFINITIVE)) // find the verb root.
 		{
 			char word[MAX_WORD_SIZE];
 			strcpy(word,original);
@@ -881,7 +883,7 @@ static void SetCanonicalValue(int start,int end)
 			else canonicalLower[i] = can;
 		}
 		if (canonicalLower[i] && IsDigit(*canonicalLower[i]->word)) wordCanonical[i] = canonicalLower[i]->word; // leave numbers alone
-		else if (canonicalLower[i] && originalLower[i]) 
+		else if (csEnglish && canonicalLower[i] && originalLower[i])
 		{
 			if (!GetCanonical(originalLower[i]) && posValues[i] & NOUN_SINGULAR && !(allOriginalWordBits[i] & NOUN_GERUND) && stricmp(canonicalLower[i]->word,(char*)"unknown-word")) // saw does not become see, it stays original - but singing should still be sing and "what do you think of dafatgat" should remain
 			{
@@ -893,7 +895,7 @@ static void SetCanonicalValue(int start,int end)
 		else if (canonicalUpper[i]) wordCanonical[i] = canonicalUpper[i]->word;
 		else wordCanonical[i] = wordStarts[i];
 	}
-	SetSentenceTense(start,end);
+	if (csEnglish) SetSentenceTense(start,end);
 }
 
 static char* PosBits(uint64 bits, char* buff)
@@ -1387,7 +1389,6 @@ void TagIt() // get the set of all possible tags. Parse if one can to reduce thi
 	if (!externalTagger && *GetUserVariable((char*)"$cs_externaltag"))
 	{
 		// not treetagger, just a named topic
-		externalTagger = 1;
 		OnceCode((char*)"$cs_externaltag");
 	}
 
 
@@ -3132,7 +3132,7 @@ static FunctionResult SetCanonCode(char* buffer)
 	int n = atoi(arg1);
 	if (n < 1 || n > wordCount) return FAILRULE_BIT;
 	char* arg2 = ARGUMENT(2);
-	WORDP D = StoreWord(arg2);
+	WORDP D = StoreWord(arg2,AS_IS);
 	wordCanonical[n] = D->word;
 	if (!IsUpperCase(*wordCanonical[n]))
 	{
 
@@ -2967,7 +2967,7 @@ void OnceCode(const char* var,char* function) //   run before doing any of his i
 	if (BlockedBotAccess(topicid) || GAMBIT_MAX(block->topicMaxRule) == 0)
 	{
 		char word[MAX_WORD_SIZE];
-		sprintf(word,"There are no gambits in topic %s for %s.",GetTopicName(topicid),var);
+		sprintf(word,"There are no gambits in topic %s for %s or topic is blocked for this bot.",GetTopicName(topicid),var);
 		AddResponse(word,0);
 		ChangeDepth(-1,name);
         return;
 
@@ -4248,8 +4248,8 @@ char* ReadOutput(bool optionalBrace,bool nested,char* ptr, FILE* in,char* &mydat
 		}
 		if (*word == 'a' && word[2] == 0 && (word[1] == ';' || word[1] == '"' || word[1] == '\'' ) ) 
 			WARNSCRIPT((char*)"Is %s supposed to be a rejoinder marker?\r\n",word,currentFilename);
-
-		if ((*word == '}' && level == 0) || TopLevelUnit(word) || TopLevelRule(lowercaseForm) || Rejoinder(lowercaseForm) || !stricmp(word,(char*)"datum:")) //   responder definition ends when another major unit or top level responder starts
+		if (*word == '}' && level == 0 && !optionalBrace) BADSCRIPT("extra } closing nothing")
+		if ((*word == '}' && level == 0 && optionalBrace) ||  TopLevelUnit(word) || TopLevelRule(lowercaseForm) || Rejoinder(lowercaseForm) || !stricmp(word,(char*)"datum:")) //   responder definition ends when another major unit or top level responder starts
 		{
 			if (*word != ':') // allow commands here 
 			{
@@ -4690,7 +4690,7 @@ Then one of 3 kinds of character:
 			//  word is a rejoinder type
 			strcpy(kind,lowercaseForm);
 		}
-		else ReportBug((char*)"unexpected word in ReadTopLevelRule - %s",word)
+		else ReportBug((char*)"Prior script not complete- unexpected top level word %s after seeing %s", lowercaseForm, data - 20)
 	}
 
 	//   did he forget to fill in any [] jumps
 
@@ -2292,7 +2292,7 @@ static void LoadTopicData(const char* fname,const char* layerid,unsigned int bui
 		}
 		else
 		{
-			ptr = ReadInt(ptr,block->topicFlags);
+			ptr = ReadInt(ptr,block->topicFlags); //0x19 111423313 1 0 65 simpletopic.top
 			if (block->topicFlags & TOPIC_SHARE) shared = true; // need more data written into USER zone
 			ptr = ReadInt(ptr,block->topicChecksum);
  			ptr = ReadInt(ptr,topLevelRules);
 
@@ -266,6 +266,7 @@ setting them.
 | `%day`              |Sunday, etc
 | `%daynumber`        | 1-7 where 1 = Sunday
 | `%fulltime`         | seconds representing the current time and date (Unix epoch time) 
+| `%fullmstime`       | milliseconds representing the current time and date (Unix epoch time in milliseconds)
 | `%hour`             |  0-23
 | `%timenumbers`      | completely consistent full time info in numbers that you can do <br>`_0 = ^burst(%timenumbers)`to get  `_0` =seconds (2digit) <br>`_1`=minutes (2digit) <br>`_2`=hours (2digit) <br>`_3`=dayinweek(0-6 Sunday=0) <br>`_4`=dateinmonth (1-31) <br>`_5`=month(0-11 January=0) <br>`_6`=year.<br>You need to get it simultaneously if you want to do accurate things with current time, since retrieving %hour %minute separately allows time to change between calls 
 | `%leapyear`         | boolean if current year is a leap year 
 
@@ -342,7 +342,7 @@ http://www.cis.uni-muenchen.de/~schmid/tools/TreeTagger/
 The German bot assumes you have installed TreeTagger and the German data per the instructions provided
 on the TreeTagger website. I have only tried the Windows installation.
 
-To use a foreign tagger, you set the `$cs_externaltag` variable in your bot definition to a topic that will
+To use a foreign tagger, you set the `$cs_externaltag` variable in your bot definition to a topic (called in Gambit mode) that will
 perform the work. You also need to stop ChatScript from doing that work itself: make sure the
 `$cs_token` in your bot definition does NOT include any of the following: `#DO_SPELLCHECK`, `#DO_PARSE`,
 `#DO_SUBSTITUTE_SYSTEM` (since that performs English substitutions and punctuation processing).
Original file line number	Diff line number	Diff line change
`@@ -720,6 +720,7 @@ static void SetCanonicalValue(int start,int end)`
`720`	`720`	`else ++lower;`
`721`	`721`	`}`
`722`	`722`	`bool caseSignificant = (lower > 3 && lower > upper);`
	`723`	`+ bool csEnglish = !stricmp(language, "english");`
`723`	`724`
`724`	`725`	`// now set canonical lowercase forms`
`725`	`726`	`for (int i = start; i <= end; ++i)`
`@@ -734,7 +735,8 @@ static void SetCanonicalValue(int start,int end)`
`734`	`735`	`WORDP D = FindWord(original);`
`735`	`736`	`WORDP canon1 = (D) ? GetCanonical(D) : NULL;`
`736`	`737`	`char* canon = (canon1) ? canon1->word : NULL;`
`737`		`- if (posValues[i] & (DETERMINER\| IDIOM) && original[1] == 0) // treat "a" as not a letter A`
	`738`	`+`
	`739`	`+ if (csEnglish && posValues[i] & (DETERMINER\| IDIOM) && original[1] == 0) // treat "a" as not a letter A`
`738`	`740`	`{`
`739`	`741`	`canon = NULL;`
`740`	`742`	`canonicalLower[i] = originalLower[i];`
`@@ -746,7 +748,7 @@ static void SetCanonicalValue(int start,int end)`
`746`	`748`	`canonicalLower[i] = originalLower[i];`
`747`	`749`	`continue;`
`748`	`750`	`}`
`749`		`- else if (allOriginalWordBits[i] & CONJUNCTION )`
	`751`	`+ else if (csEnglish && allOriginalWordBits[i] & CONJUNCTION )`
`750`	`752`	`{`
`751`	`753`	`if (!stricmp(wordStarts[i], "times")) // a conjunction looking like plural that in singular is a normal word`
`752`	`754`	`{`
`@@ -757,19 +759,19 @@ static void SetCanonicalValue(int start,int end)`
`757`	`759`	`}`
`758`	`760`
`759`	`761`	`// a word like "won" has noun, verb, adjective meanings. We prefer a canonical that's different from the original`
`760`		`- if (canon && IsUpperCase(*canon)) canonicalUpper[i] = FindWord(canon);`
`761`		`- else if (canon) canonicalLower[i] = FindWord(canon);`
	`762`	`+ if (csEnglish && canon && IsUpperCase(*canon)) canonicalUpper[i] = FindWord(canon);`
	`763`	`+ else if (csEnglish && canon) canonicalLower[i] = FindWord(canon);`
`762`	`764`	`else if (pos & NUMBER_BITS); // must occur before verbs and nouns, since "second" is a verb and a noun`
`763`	`765`	`else if (canonicalLower[i] && canonicalLower[i]->properties & (NOUN_NUMBER\|ADJECTIVE_NUMBER)); // dont change canonical numbers like December second`
`764`		`- else if (allOriginalWordBits[i] & NOUN_GERUND) // because singing is a dict word, we might prefer noun over gerund. We shouldned`
	`766`	`+ else if (csEnglish && allOriginalWordBits[i] & NOUN_GERUND) // because singing is a dict word, we might prefer noun over gerund. We shouldned`
`765`	`767`	`{`
`766`	`768`	`canonicalLower[i] = FindWord(GetInfinitive(original,false));`
`767`	`769`	`}`
`768`		`- else if (pos & (VERB_BITS \| NOUN_GERUND \| NOUN_INFINITIVE\|ADJECTIVE_PARTICIPLE) )`
	`770`	`+ else if (csEnglish && pos & (VERB_BITS \| NOUN_GERUND \| NOUN_INFINITIVE\|ADJECTIVE_PARTICIPLE) )`
`769`	`771`	`{`
`770`	`772`	`canonicalLower[i] = FindWord(GetInfinitive(original,false));`
`771`	`773`	`}`
`772`		`- else if (pos & ADJECTIVE_NORMAL && !(D && D->properties & (MORE_FORM\|MOST_FORM)))`
	`774`	`+ else if (csEnglish && pos & ADJECTIVE_NORMAL && !(D && D->properties & (MORE_FORM\|MOST_FORM)))`
`773`	`775`	`{`
`774`	`776`	`canonicalLower[i] = originalLower[i]; // "his *fixed view should be adjective and not participle given it is an adjective- arbitrary`
`775`	`777`	`if (allOriginalWordBits[i] & ADJECTIVE_PARTICIPLE)`
`@@ -778,7 +780,7 @@ static void SetCanonicalValue(int start,int end)`
`778`	`780`	`if (verb) canonicalLower[i] = FindWord(verb);`
`779`	`781`	`}`
`780`	`782`	`}`
`781`		`- else if (pos & (NOUN_BITS - NOUN_GERUND - NOUN_ADJECTIVE) \|\| (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original)))`
	`783`	`+ else if (csEnglish && pos & (NOUN_BITS - NOUN_GERUND - NOUN_ADJECTIVE) \|\| (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original)))`
`782`	`784`	`{`
`783`	`785`	`if (pos & (NOUN_PROPER_SINGULAR\|NOUN_PROPER_PLURAL) && canonicalUpper[i] && canonicalUpper[i]->properties & NOUN) // can it be upper case interpretation?`
`784`	`786`	`{`
`@@ -793,17 +795,17 @@ static void SetCanonicalValue(int start,int end)`
`793`	`795`	`}`
`794`	`796`	`if (canonicalLower[i] && canonicalLower[i]->properties & (DETERMINER\|NUMBER_BITS));`
`795`	`797`	`else if (IsAlphaUTF8(original) && canonicalLower[i] && !strcmp(canonicalLower[i]->word,(char)"unknown-word")); // keep unknown-ness`
`796`		`- else if (pos & NOUN_BITS && !canonicalUpper[i])`
	`798`	`+ else if (csEnglish && pos & NOUN_BITS && !canonicalUpper[i])`
`797`	`799`	`{`
`798`	`800`	`char* noun = GetSingularNoun(original,false,true);`
`799`	`801`	`if (noun) canonicalLower[i] = FindWord(noun);`
`800`	`802`	`}`
`801`		`- else if (D && D->internalBits & UPPERCASE_HASH && FindWord(original, 0,LOWERCASE_LOOKUP))`
	`803`	`+ else if (csEnglish && D && D->internalBits & UPPERCASE_HASH && FindWord(original, 0,LOWERCASE_LOOKUP))`
`802`	`804`	`{`
`803`	`805`	`canonicalLower[i] = FindWord(original,0, LOWERCASE_LOOKUP);`
`804`	`806`	`}`
`805`	`807`	`}`
`806`		`- else if (pos & (ADJECTIVE_BITS - ADJECTIVE_PARTICIPLE - ADJECTIVE_NOUN) \|\| (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original)))`
	`808`	`+ else if (csEnglish && pos & (ADJECTIVE_BITS - ADJECTIVE_PARTICIPLE - ADJECTIVE_NOUN) \|\| (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original)))`
`807`	`809`	`{`
`808`	`810`	`if (canonicalLower[i] && canonicalLower[i]->properties & NUMBER_BITS);`
`809`	`811`	`else`
`@@ -813,13 +815,13 @@ static void SetCanonicalValue(int start,int end)`
`813`	`815`	`}`
`814`	`816`
`815`	`817`	`// for adjectives that are verbs, like married, go canonical to the verb if adjective is unchanged`
`816`		`- if (canonicalLower[i] && !strcmp(canonicalLower[i]->word,original))`
	`818`	`+ if (csEnglish && canonicalLower[i] && !strcmp(canonicalLower[i]->word,original))`
`817`	`819`	`{`
`818`	`820`	`char* infinitive = GetInfinitive(original,false);`
`819`	`821`	`if (infinitive) canonicalLower[i] = FindWord(infinitive);`
`820`	`822`	`}`
`821`	`823`	`}`
`822`		`- else if (pos & ADJECTIVE_NOUN)`
	`824`	`+ else if (csEnglish && pos & ADJECTIVE_NOUN)`
`823`	`825`	`{`
`824`	`826`	`if (canonicalLower[i] && canonicalLower[i]->properties & NUMBER_BITS);`
`825`	`827`	`else if (IsUpperCase(*wordStarts[i]) && caseSignificant) {;} // upper case is intentional`
`@@ -829,7 +831,7 @@ static void SetCanonicalValue(int start,int end)`
`829`	`831`	`if (adj) canonicalLower[i] = FindWord(adj);`
`830`	`832`	`}`
`831`	`833`	`}`
`832`		`- else if (pos & ADVERB \|\| (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original)))`
	`834`	`+ else if (csEnglish && pos & ADVERB \|\| (canonicalLower[i] && !stricmp(canonicalLower[i]->word,original)))`
`833`	`835`	`{`
`834`	`836`	`if (canonicalLower[i] && canonicalLower[i]->properties & NUMBER_BITS);`
`835`	`837`	`else canonicalLower[i] = FindWord(GetAdverbBase(original,false));`
`@@ -844,14 +846,14 @@ static void SetCanonicalValue(int start,int end)`
`844`	`846`	`else if (*original == '~') canonicalLower[i] = FindWord(original);`
`845`	`847`	`else if (!IsAlphaUTF8(*original)) canonicalLower[i] = FindWord(original);`
`846`	`848`
`847`		`- if (pos & PRONOUN_BITS && !stricmp(original,(char*)"one")) // make it a number`
	`849`	`+ if (csEnglish && pos & PRONOUN_BITS && !stricmp(original,(char*)"one")) // make it a number`
`848`	`850`	`{`
`849`	`851`	`canonicalLower[i] = StoreWord((char*)"1",NOUN\|NOUN_NUMBER);`
`850`	`852`	`}`
`851`	`853`
`852`	`854`	`// handle composite verb canonical for single hypen case`
`853`	`855`	`char* hyphen = strchr(original,'-');`
`854`		`- if (hyphen && pos & (VERB_BITS\|NOUN_GERUND\|ADJECTIVE_PARTICIPLE\|NOUN_INFINITIVE)) // find the verb root.`
	`856`	`+ if (csEnglish && hyphen && pos & (VERB_BITS\|NOUN_GERUND\|ADJECTIVE_PARTICIPLE\|NOUN_INFINITIVE)) // find the verb root.`
`855`	`857`	`{`
`856`	`858`	`char word[MAX_WORD_SIZE];`
`857`	`859`	`strcpy(word,original);`
`@@ -881,7 +883,7 @@ static void SetCanonicalValue(int start,int end)`
`881`	`883`	`else canonicalLower[i] = can;`
`882`	`884`	`}`
`883`	`885`	`if (canonicalLower[i] && IsDigit(*canonicalLower[i]->word)) wordCanonical[i] = canonicalLower[i]->word; // leave numbers alone`
`884`		`- else if (canonicalLower[i] && originalLower[i])`
	`886`	`+ else if (csEnglish && canonicalLower[i] && originalLower[i])`
`885`	`887`	`{`
`886`	`888`	`if (!GetCanonical(originalLower[i]) && posValues[i] & NOUN_SINGULAR && !(allOriginalWordBits[i] & NOUN_GERUND) && stricmp(canonicalLower[i]->word,(char*)"unknown-word")) // saw does not become see, it stays original - but singing should still be sing and "what do you think of dafatgat" should remain`
`887`	`889`	`{`
`@@ -893,7 +895,7 @@ static void SetCanonicalValue(int start,int end)`
`893`	`895`	`else if (canonicalUpper[i]) wordCanonical[i] = canonicalUpper[i]->word;`
`894`	`896`	`else wordCanonical[i] = wordStarts[i];`
`895`	`897`	`}`
`896`		`- SetSentenceTense(start,end);`
	`898`	`+ if (csEnglish) SetSentenceTense(start,end);`
`897`	`899`	`}`
`898`	`900`
`899`	`901`	`static char* PosBits(uint64 bits, char* buff)`
`@@ -1387,7 +1389,6 @@ void TagIt() // get the set of all possible tags. Parse if one can to reduce thi`
`1387`	`1389`	`if (!externalTagger && GetUserVariable((char)"$cs_externaltag"))`
`1388`	`1390`	`{`
`1389`	`1391`	`// not treetagger, just a named topic`
`1390`		`- externalTagger = 1;`
`1391`	`1392`	`OnceCode((char*)"$cs_externaltag");`
`1392`	`1393`	`}`
`1393`	`1394`
Original file line number	Diff line number	Diff line change
`@@ -3132,7 +3132,7 @@ static FunctionResult SetCanonCode(char* buffer)`
`3132`	`3132`	`int n = atoi(arg1);`
`3133`	`3133`	`if (n < 1 \|\| n > wordCount) return FAILRULE_BIT;`
`3134`	`3134`	`char* arg2 = ARGUMENT(2);`
`3135`		`- WORDP D = StoreWord(arg2);`
	`3135`	`+ WORDP D = StoreWord(arg2,AS_IS);`
`3136`	`3136`	`wordCanonical[n] = D->word;`
`3137`	`3137`	`if (!IsUpperCase(*wordCanonical[n]))`
`3138`	`3138`	`{`
Original file line number	Diff line number	Diff line change
`@@ -2967,7 +2967,7 @@ void OnceCode(const char* var,char* function) // run before doing any of his i`
`2967`	`2967`	`if (BlockedBotAccess(topicid) \|\| GAMBIT_MAX(block->topicMaxRule) == 0)`
`2968`	`2968`	`{`
`2969`	`2969`	`char word[MAX_WORD_SIZE];`
`2970`		`- sprintf(word,"There are no gambits in topic %s for %s.",GetTopicName(topicid),var);`
	`2970`	`+ sprintf(word,"There are no gambits in topic %s for %s or topic is blocked for this bot.",GetTopicName(topicid),var);`
`2971`	`2971`	`AddResponse(word,0);`
`2972`	`2972`	`ChangeDepth(-1,name);`
`2973`	`2973`	`return;`
Original file line number	Diff line number	Diff line change
`@@ -4248,8 +4248,8 @@ char* ReadOutput(bool optionalBrace,bool nested,char* ptr, FILE* in,char* &mydat`
`4248`	`4248`	`}`
`4249`	`4249`	`if (*word == 'a' && word[2] == 0 && (word[1] == ';' \|\| word[1] == '"' \|\| word[1] == '\'' ) )`
`4250`	`4250`	`WARNSCRIPT((char*)"Is %s supposed to be a rejoinder marker?\r\n",word,currentFilename);`
`4251`		`-`
`4252`		`- if ((word == '}' && level == 0) \|\| TopLevelUnit(word) \|\| TopLevelRule(lowercaseForm) \|\| Rejoinder(lowercaseForm) \|\| !stricmp(word,(char)"datum:")) // responder definition ends when another major unit or top level responder starts`
	`4251`	`+ if (*word == '}' && level == 0 && !optionalBrace) BADSCRIPT("extra } closing nothing")`
	`4252`	`+ if ((word == '}' && level == 0 && optionalBrace) \|\| TopLevelUnit(word) \|\| TopLevelRule(lowercaseForm) \|\| Rejoinder(lowercaseForm) \|\| !stricmp(word,(char)"datum:")) // responder definition ends when another major unit or top level responder starts`
`4253`	`4253`	`{`
`4254`	`4254`	`if (*word != ':') // allow commands here`
`4255`	`4255`	`{`
`@@ -4690,7 +4690,7 @@ Then one of 3 kinds of character:`
`4690`	`4690`	`// word is a rejoinder type`
`4691`	`4691`	`strcpy(kind,lowercaseForm);`
`4692`	`4692`	`}`
`4693`		`- else ReportBug((char*)"unexpected word in ReadTopLevelRule - %s",word)`
	`4693`	`+ else ReportBug((char*)"Prior script not complete- unexpected top level word %s after seeing %s", lowercaseForm, data - 20)`
`4694`	`4694`	`}`
`4695`	`4695`
`4696`	`4696`	`// did he forget to fill in any [] jumps`
Original file line number	Diff line number	Diff line change
`@@ -2292,7 +2292,7 @@ static void LoadTopicData(const char* fname,const char* layerid,unsigned int bui`
`2292`	`2292`	`}`
`2293`	`2293`	`else`
`2294`	`2294`	`{`
`2295`		`- ptr = ReadInt(ptr,block->topicFlags);`
	`2295`	`+ ptr = ReadInt(ptr,block->topicFlags); //0x19 111423313 1 0 65 simpletopic.top`
`2296`	`2296`	`if (block->topicFlags & TOPIC_SHARE) shared = true; // need more data written into USER zone`
`2297`	`2297`	`ptr = ReadInt(ptr,block->topicChecksum);`
`2298`	`2298`	`ptr = ReadInt(ptr,topLevelRules);`