//***********************************************************
// Copyright © 2008 Valentin Pavlyuchenko
//
// This file is part of Boltun.
//
// Boltun is free software: you can redistribute it and/or modify
// it under the terms of the GNU General Public License as published by
// the Free Software Foundation, either version 2 of the License, or
// (at your option) any later version.
//
// Boltun is distributed in the hope that it will be useful,
// but WITHOUT ANY WARRANTY; without even the implied warranty of
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
// GNU General Public License for more details.
//
// You should have received a copy of the GNU General Public License
// along with Boltun. If not, see .
//
//***********************************************************
#include "../stdafx.h"
#ifdef _DEBUG
//#define DEBUG_PREFIXES
//#define DEBUG_SHOW_LEVEL
//#define DEBUG_SHOW_VARIANTS
//#define DEBUG_SHOW_SOLUTION_REASON
#endif
//Enabling next define will make a bot more stupid:
//#define EXCLUDE_SPECIAL_WORDS
#ifdef DEBUG_SHOW_VARIANTS
extern void AddBotMessage(wstring s);
#endif
using namespace std;
void TalkBot::UpdateStartChar(wstring &str)
{
if (!makeLowercase)
return;
size_t l = str.length();
if (l) {
// Answers starting with ' ' must remain unchanged.
if (str[0] == ' ') {
str = str.substr(1);
return;
}
wchar_t *strl = NEWWSTR_ALLOCA(str.c_str()), *stru = NEWWSTR_ALLOCA(str.c_str());
CharLower(strl);
CharUpper(stru);
for (size_t i = 0; i < l; i++) {
wchar_t cl = strl[i];
wchar_t cu = stru[i];
if (i != l - 1) {
// Do not react to BLONDE ANSWERS
wchar_t ncl = strl[i+1];
wchar_t ncu = stru[i+1];
if (ncl != ncu && str[i+1] == ncu)
break;
}
if (cl != cu) {
str[i] = cl;
break;
}
}
}
}
TalkBot::TalkBot(const Mind& goodMind)
:mind(goodMind), beSilent(false), makeLowercase(false),
understandAlways(false)
{
contactDatas = new PerContactData(mind);
}
TalkBot::~TalkBot()
{
delete contactDatas;
}
wstring TalkBot::GetInitMessage(MCONTACT contact)
{
ContactData* d = contactDatas->GetData(contact);
wstring s = d->initial.GetString();
contactDatas->PutData(contact);
return s;
}
wstring TalkBot::ReplaceAliases(const wstring &message)
{
const wchar_t dividers[] = L" \t\n\r,./?\\|;:'\"~!#^&*()_-+=[{]}—\1";
wstring sentence = message;
wstring result;
map sm;
//Find smiles
for (size_t i = 0; i < sentence.length() - 1; i++) {
unsigned max = (int)(sentence.length() - i);
if (max > mind.GetData()->maxSmileLen)
max = mind.GetData()->maxSmileLen;
for (unsigned j = max; j > 0; j--) {
wstring item = sentence.substr(i, j);
if (mind.GetData()->smiles.find(item) != mind.GetData()->smiles.end()) {
sm[i] = item;
sentence.replace(i, j, L"\1");
break;
}
}
}
int len = (int)sentence.length();
bool hadQuestionSigns = false;
int it = 0;
while (it != len) {
while (it != len && wcschr(dividers, sentence[it])) {
if (sentence[it] == '?')
hadQuestionSigns = true;
map::iterator smit;
if (sentence[it] == '\1') {
smit = sm.find(it);
result.append((*smit).second);
}
else
result.push_back(sentence[it]);
it++;
}
if (it == len)
break;
int start = it;
while (true) {
while (it != len && !wcschr(dividers, sentence[it]))
it++;
if (it == len || sentence[it] != '-')
break;
//If we have-a-word-with-minus, we shouldn't split it
if (wcschr(dividers, sentence[it + 1]))
break;
it += 2;
}
wstring str = sentence.substr(start, it - start);
map::const_iterator al = mind.GetData()->aliases.find(str);
if (al != mind.GetData()->aliases.end())
result.append((*al).second);
else
result.append(str);
}
return result;
}
wstring TalkBot::AllReplies(const wstring &incomingMessage, ContactData *contactData, Level &maxValue, std::multimap &mm)
{
wstring res;
//Part 1
if (FindExact(contactData, incomingMessage, mind.GetData()->widelyUsed, res)) //widelyUsed
{
return res;
}
//Part 2
if (FindExact(contactData, incomingMessage, mind.GetData()->study, res)) //study
{
#ifdef DEBUG_PREFIXES
mm.insert(make_pair(LOOKSLIKE, L"(study_all) " + res));
#else
mm.insert(make_pair(LOOKSLIKE, res));
#endif
maxValue = LOOKSLIKE;
}
//Part 3
vector sentences;
SplitSectences(incomingMessage, sentences);
ValueChooser<> ch(sentences, true); //Using random order of sentences.
while ((res = ch.GetString()) != L"") {
//Part 4
if (FindExact(contactData, res, mind.GetData()->widelyUsed, res)) //widelyUsed
{
#ifdef DEBUG_PREFIXES
mm.insert(make_pair(BEST, L"(widelyused_sent) " + res));
#else
mm.insert(make_pair(BEST, res));
#endif
if (maxValue > BEST)
maxValue = BEST;
}
//Part 5
if (FindExact(contactData, res, mind.GetData()->study, res)) //study
{
#ifdef DEBUG_PREFIXES
mm.insert(make_pair(LOOKSLIKE, L"(study_sent) " + res));
#else
mm.insert(make_pair(LOOKSLIKE, res));
#endif
if (maxValue > LOOKSLIKE)
maxValue = LOOKSLIKE;
}
//Part 6
vector keywords, otherwords;
bool isQuestion;
SplitAndSortWords(res, keywords, otherwords, isQuestion);
//Part 7, 8
res = L"";
FindByKeywords(contactData, keywords, res/*, ures*/, isQuestion); //keywords
if (res != L"") {
#ifdef DEBUG_PREFIXES
mm.insert(make_pair(LOOKSLIKE, L"(keywords) " + res));
#else
mm.insert(make_pair(LOOKSLIKE, res));
#endif
if (maxValue > LOOKSLIKE)
maxValue = LOOKSLIKE;
}
/* if (ures != L"")
{
#ifdef DEBUG_PREFIXES
mm.insert(make_pair(LOOKSLIKE2, L"(keywords_unstrict) "+ures));
#else
mm.insert(make_pair(LOOKSLIKE2, ures));
#endif
if (maxValue > LOOKSLIKE2)
maxValue = LOOKSLIKE2;
}*/
//Part 9
if (FindByOthers(contactData, otherwords, res, isQuestion)) //specialEscapes
{
#ifdef DEBUG_PREFIXES
mm.insert(make_pair(BAD, L"(otherwords) " + res));
#else
mm.insert(make_pair(BAD, res));
#endif
if (maxValue > BAD)
maxValue = BAD;
}
}
if (!beSilent) {
//Part 10
if (FindAny(contactData->escape, res)) //escape
{
#ifdef DEBUG_PREFIXES
mm.insert(make_pair(FAIL, L"(escape) " + res));
#else
mm.insert(make_pair(FAIL, res));
#endif
if (maxValue > FAIL)
maxValue = FAIL;
}
//Part 11
if (!understandAlways && FindAny(contactData->failure, res)) //failure
{
#ifdef DEBUG_PREFIXES
mm.insert(make_pair(FAIL, L"(failure) " + res));
#else
mm.insert(make_pair(FAIL, res));
#endif
if (maxValue > FAIL)
maxValue = FAIL;
}
}
return wstring();
}
TalkBot::MessageInfo* TalkBot::Reply(MCONTACT contact, wstring incomingMessage, bool saveChoice)
{
wchar_t* str = new wchar_t[incomingMessage.length() + 1];
mir_tstrcpy(str, incomingMessage.c_str());
CharLower(str);
incomingMessage = str;
delete[] str;
ContactData *contactData = contactDatas->GetData(contact);
if (incomingMessage == contactData->lastMessage && GetTickCount() < contactData->lastMessageTime + 30 * 60 * 1000) {
MessageInfo *info;
//only 2-3 repeats
if (contactData->repeatCount < 2 || contactData->repeatCount == 2 && (rand() % 2)) {
const vector& v = mind.GetData()->repeats;
wstring res = v[rand() % v.size()];
#ifdef DEBUG_PREFIXES
info = new MessageInfo(incomingMessage, L"(repeat_norm) " + res);
#else
info = new MessageInfo(incomingMessage, res);
#endif
}
else
#ifdef DEBUG_PREFIXES
info = new MessageInfo(incomingMessage, L"(repeat_silence)");
#else
info = new MessageInfo(incomingMessage, L"");
#endif
if (saveChoice)
RecordAnswer(contactData, *info);
contactDatas->PutData(contact);
return info;
}
multimap mm;
Level maxValue = NOTHING;
wstring res = AllReplies(incomingMessage, contactData, maxValue, mm);
if (!res.empty()) {
UpdateStartChar(res);
#ifdef DEBUG_PREFIXES
MessageInfo *info = new MessageInfo(incomingMessage, L"(widelyused_all) " + res);
#else
MessageInfo *info = new MessageInfo(incomingMessage, res);
#endif
if (saveChoice)
RecordAnswer(contactData, *info);
contactDatas->PutData(contact);
return info;
}
incomingMessage = ReplaceAliases(incomingMessage);
res = AllReplies(incomingMessage, contactData, maxValue, mm);
if (!res.empty()) {
UpdateStartChar(res);
#ifdef DEBUG_PREFIXES
MessageInfo *info = new MessageInfo(incomingMessage, L"(widelyused_all) " + res);
#else
MessageInfo *info = new MessageInfo(incomingMessage, res);
#endif
if (saveChoice)
RecordAnswer(contactData, *info);
contactDatas->PutData(contact);
return info;
}
//Also does Part 12
wstring final = ChooseResult(contactData, maxValue, mm);
MessageInfo *info = new MessageInfo(incomingMessage, final);
UpdateStartChar(final);
if (saveChoice)
RecordAnswer(contactData, *info);
contactDatas->PutData(contact);
return info;
}
bool TalkBot::FindExact(ContactData *contactData, const wstring &incomingMessage,
const multimap &map, wstring &res)
{
int max = (int)map.count(incomingMessage);
if (!max) {
wchar_t c = incomingMessage[incomingMessage.length() - 1];
if (c != '?' && c != '.' && c != '!')
return FindExact(contactData, incomingMessage + L'.', map, res);
return false;
}
pair range = map.equal_range(incomingMessage);
for (mm_cit it = range.first; it != range.second; ++it)
contactData->chooser.AddChoice((*it).second);
res = contactData->chooser.Choose();
return true;
}
void TalkBot::AnswerGiven(MCONTACT contact, const TalkBot::MessageInfo& info)
{
ContactData *contactData = contactDatas->GetData(contact);
RecordAnswer(contactData, info);
contactDatas->PutData(contact);
}
void TalkBot::RecordAnswer(ContactData *contactData, const TalkBot::MessageInfo& info)
{
contactData->chooser.SaveChoice(info.Answer);
if (contactData->lastMessage == info.Question)
contactData->repeatCount++;
else
contactData->repeatCount = 0;
contactData->lastMessageTime = GetTickCount();
contactData->lastMessage = info.Question;
}
bool TalkBot::FindAny(ValueChooser<> &ch, wstring& res)
{
if (!ch.GetContainer().size())
return false;
res = ch.GetString();
return true;
}
void TalkBot::SplitSectences(const wstring &incomingMessage, vector& vec)
{
//FIXME: (THINK ABOUT IT:-))these chars not always mark the end of sentence.
const wchar_t symbols[] = L".?!";
int it = 0, len = (int)incomingMessage.length();
while (it != len) {
while (it != len && iswspace(incomingMessage[it]))
it++;
int start = it;
while (it != len) {
if (wcschr(symbols, incomingMessage[it++])) {
//Test for a :-! smile
if (it > 2 && incomingMessage[it - 1] == '!'
&& incomingMessage[it - 2] == '-'
&& incomingMessage[it - 3] == ':')
continue;
while (it != len && wcschr(symbols, incomingMessage[it]))
it++;
break;
}
}
vec.insert(vec.end(), incomingMessage.substr(start, it - start));
}
}
#ifdef _DEBUG
wstring LevelToStr(TalkBot::Level target)
{
wstring lev;
switch (target) {
case TalkBot::BEST: lev = L"BEST(0)"; break;
case TalkBot::LOOKSLIKE: lev = L"LOOKSLIKE(1)"; break;
case TalkBot::BAD: lev = L"BAD(2)"; break;
case TalkBot::FAIL: lev = L"FAIL(3)"; break;
case TalkBot::NOTHING: lev = L"NOTHING(4)"; break;
}
return lev;
}
#endif
wstring TalkBot::ChooseResult(ContactData *contactData, Level maxValue, const multimap &mm)
{
#ifdef DEBUG_SHOW_VARIANTS
AddBotMessage(L">>Availabe:");
for (multimap::iterator it = mm.begin(); it != mm.end(); it++)
AddBotMessage(LevelToStr((*it).first) + L": " + (*it).second);
AddBotMessage(L">>Result:");
#endif
if (maxValue == NOTHING)
return L"";
Level target = maxValue;
typedef multimap::const_iterator lt_cit;
pair range = mm.equal_range(target);
for (lt_cit it = range.first; it != range.second; ++it)
contactData->chooser.AddChoice((*it).second);
#ifdef DEBUG_SHOW_LEVEL
wstring lev = LevelToStr(target);
return lev + L": " + contactData->chooser.Choose();
#else
return contactData->chooser.Choose();
#endif
}
void TalkBot::FindByKeywords(ContactData *contactData, const vector &keywords, wstring& res/*, wstring& ures*/,
bool isQuestion)
{
if (keywords.size() == 0)
return;
const multimap &keys = isQuestion ? mind.GetData()->qkeywords :
mind.GetData()->keywords;
for (multimap::const_iterator it = keys.begin(); it != keys.end(); ++it) {
float prio;
if ((*it).first.MatchesAll(keywords/*, strict*/, prio))
#ifdef DEBUG_SHOW_SOLUTION_REASON
contactData->chooser.AddChoice((wstring)(*it).first + L": - " + (*it).second, prio);
#else
contactData->chooser.AddChoice((*it).second, prio);
#endif
}
res = contactData->chooser.Choose();
}
bool TalkBot::FindByOthers(ContactData *contactData, const vector &otherwords, wstring& res, bool isQuestion)
{
//vector results;
const multimap &specs = isQuestion ? mind.GetData()->qspecialEscapes :
mind.GetData()->specialEscapes;
for (multimap::const_iterator it = specs.begin();
it != specs.end(); ++it)
if ((*it).first.MatchesAny(otherwords)) {
#ifdef DEBUG_SHOW_SOLUTION_REASON
contactData->chooser.AddChoice((wstring)(*it).first + L": - " + (*it).second);
#else
contactData->chooser.AddChoice((*it).second);
#endif
}
res = contactData->chooser.Choose();
if (res.empty())
return false;
return true;
}
const Mind& TalkBot::GetMind() const
{
return mind;
}
void TalkBot::SplitAndSortWords(wstring sentence, vector& keywords,
vector& otherwords, bool& isQuestion)
{
const wchar_t dividers[] = L" \t\n\r,./?\\|;:'\"~!#^&*()_-+=[{]}—";
int len = (int)sentence.length();
vector words;
map sm;
//Find smiles
for (size_t i = 0; i < sentence.length() - 1; i++) {
unsigned max = (int)(sentence.length() - i);
if (max > mind.GetData()->maxSmileLen)
max = mind.GetData()->maxSmileLen;
for (unsigned j = max; j > 0; j--) {
wstring item = sentence.substr(i, j);
if (mind.GetData()->smiles.find(item)
!= mind.GetData()->smiles.end()) {
sm[i] = item;
sentence.replace(i, j, L" ");
break;
}
}
}
len = (int)sentence.length();
bool hadQuestionSigns = false;
for (int it = 0; it != len;) {
while (it != len && wcschr(dividers, sentence[it])) {
if (sentence[it] == '?')
hadQuestionSigns = true;
map::iterator smit;
if (iswspace(sentence[it]) && (smit = sm.find(it)) != sm.end())
words.push_back((*smit).second);
it++;
}
if (it == len)
break;
hadQuestionSigns = false;
int start = it;
while (true) {
while (it != len && !wcschr(dividers, sentence[it]))
it++;
if (it == len || sentence[it] != '-')
break;
// If we have-a-word-with-minus, we shouldn't split it
if (wcschr(dividers, sentence[it + 1]))
break;
it += 2;
}
wstring str = sentence.substr(start, it - start);
words.push_back(str);
}
isQuestion = hadQuestionSigns;
for (vector::iterator it = words.begin(); it != words.end(); ++it) {
if (!isQuestion)
if (mind.GetData()->question.find(*it) != mind.GetData()->question.end())
isQuestion = true;
if (mind.GetData()->special.find(*it) != mind.GetData()->special.end())
otherwords.push_back(*it);
#ifdef EXCLUDE_SPECIAL_WORDS
else
#endif
keywords.push_back(*it);
}
}
void TalkBot::SetSilent(const bool isSilent)
{
beSilent = isSilent;
}
void TalkBot::SetLowercase(const bool isLowercase)
{
makeLowercase = isLowercase;
}
void TalkBot::SetUnderstandAlways(const bool _understandAlways)
{
this->understandAlways = _understandAlways;
}