Created
March 11, 2019 21:41
-
-
Save easrng/b331f42f0d581f5ce7073db06c3d1474 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
/* | |
elizabot.js v.1.1 - ELIZA JS library (N.Landsteiner 2005) | |
Eliza is a mock Rogerian psychotherapist. | |
Original program by Joseph Weizenbaum in MAD-SLIP for "Project MAC" at MIT. | |
cf: Weizenbaum, Joseph "ELIZA - A Computer Program For the Study of Natural Language | |
Communication Between Man and Machine" | |
in: Communications of the ACM; Volume 9 , Issue 1 (January 1966): p 36-45. | |
JavaScript implementation by Norbert Landsteiner 2005; <http://www.masserk.at> | |
synopsis: | |
new ElizaBot( <random-choice-disable-flag> ) | |
ElizaBot.prototype.transform( <inputstring> ) | |
ElizaBot.prototype.getInitial() | |
ElizaBot.prototype.getFinal() | |
ElizaBot.prototype.reset() | |
usage: var eliza = new ElizaBot(); | |
var initial = eliza.getInitial(); | |
var reply = eliza.transform(inputstring); | |
if (eliza.quit) { | |
// last user input was a quit phrase | |
} | |
// method `transform()' returns a final phrase in case of a quit phrase | |
// but you can also get a final phrase with: | |
var final = eliza.getFinal(); | |
// other methods: reset memory and internal state | |
eliza.reset(); | |
// to set the internal memory size override property `memSize': | |
eliza.memSize = 100; // (default: 20) | |
// to reproduce the example conversation given by J. Weizenbaum | |
// initialize with the optional random-choice-disable flag | |
var originalEliza = new ElizaBot(true); | |
`ElizaBot' is also a general chatbot engine that can be supplied with any rule set. | |
(for required data structures cf. "elizadata.js" and/or see the documentation.) | |
data is parsed and transformed for internal use at the creation time of the | |
first instance of the `ElizaBot' constructor. | |
vers 1.1: lambda functions in RegExps are currently a problem with too many browsers. | |
changed code to work around. | |
*/ | |
function ElizaBot(noRandomFlag) { | |
this.noRandom= (noRandomFlag)? true:false; | |
this.capitalizeFirstLetter=true; | |
this.debug=false; | |
this.memSize=20; | |
this.version="1.1 (original)"; | |
if (!this._dataParsed) this._init(); | |
this.reset(); | |
} | |
ElizaBot.prototype.reset = function() { | |
this.quit=false; | |
this.mem=[]; | |
this.lastchoice=[]; | |
for (var k=0; k<elizaKeywords.length; k++) { | |
this.lastchoice[k]=[]; | |
var rules=elizaKeywords[k][2]; | |
for (var i=0; i<rules.length; i++) this.lastchoice[k][i]=-1; | |
} | |
} | |
ElizaBot.prototype._dataParsed = false; | |
ElizaBot.prototype._init = function() { | |
// install ref to global object | |
var global=ElizaBot.prototype.global=self; | |
// parse data and convert it from canonical form to internal use | |
// prodoce synonym list | |
var synPatterns={}; | |
if ((global.elizaSynons) && (typeof elizaSynons == 'object')) { | |
for (var i in elizaSynons) synPatterns[i]='('+i+'|'+elizaSynons[i].join('|')+')'; | |
} | |
// check for keywords or install empty structure to prevent any errors | |
if ((!global.elizaKeywords) || (typeof elizaKeywords.length == 'undefined')) { | |
elizaKeywords=[['###',0,[['###',[]]]]]; | |
} | |
// 1st convert rules to regexps | |
// expand synonyms and insert asterisk expressions for backtracking | |
var sre=/@(\S+)/; | |
var are=/(\S)\s*\*\s*(\S)/; | |
var are1=/^\s*\*\s*(\S)/; | |
var are2=/(\S)\s*\*\s*$/; | |
var are3=/^\s*\*\s*$/; | |
var wsre=/\s+/g; | |
for (var k=0; k<elizaKeywords.length; k++) { | |
var rules=elizaKeywords[k][2]; | |
elizaKeywords[k][3]=k; // save original index for sorting | |
for (var i=0; i<rules.length; i++) { | |
var r=rules[i]; | |
// check mem flag and store it as decomp's element 2 | |
if (r[0].charAt(0)=='$') { | |
var ofs=1; | |
while (r[0].charAt[ofs]==' ') ofs++; | |
r[0]=r[0].substring(ofs); | |
r[2]=true; | |
} | |
else { | |
r[2]=false; | |
} | |
// expand synonyms (v.1.1: work around lambda function) | |
var m=sre.exec(r[0]); | |
while (m) { | |
var sp=(synPatterns[m[1]])? synPatterns[m[1]]:m[1]; | |
r[0]=r[0].substring(0,m.index)+sp+r[0].substring(m.index+m[0].length); | |
m=sre.exec(r[0]); | |
} | |
// expand asterisk expressions (v.1.1: work around lambda function) | |
if (are3.test(r[0])) { | |
r[0]='\\s*(.*)\\s*'; | |
} | |
else { | |
m=are.exec(r[0]); | |
if (m) { | |
var lp=''; | |
var rp=r[0]; | |
while (m) { | |
lp+=rp.substring(0,m.index+1); | |
if (m[1]!=')') lp+='\\b'; | |
lp+='\\s*(.*)\\s*'; | |
if ((m[2]!='(') && (m[2]!='\\')) lp+='\\b'; | |
lp+=m[2]; | |
rp=rp.substring(m.index+m[0].length); | |
m=are.exec(rp); | |
} | |
r[0]=lp+rp; | |
} | |
m=are1.exec(r[0]); | |
if (m) { | |
var lp='\\s*(.*)\\s*'; | |
if ((m[1]!=')') && (m[1]!='\\')) lp+='\\b'; | |
r[0]=lp+r[0].substring(m.index-1+m[0].length); | |
} | |
m=are2.exec(r[0]); | |
if (m) { | |
var lp=r[0].substring(0,m.index+1); | |
if (m[1]!='(') lp+='\\b'; | |
r[0]=lp+'\\s*(.*)\\s*'; | |
} | |
} | |
// expand white space | |
r[0]=r[0].replace(wsre, '\\s+'); | |
wsre.lastIndex=0; | |
} | |
} | |
// now sort keywords by rank (highest first) | |
elizaKeywords.sort(this._sortKeywords); | |
// and compose regexps and refs for pres and posts | |
ElizaBot.prototype.pres={}; | |
ElizaBot.prototype.posts={}; | |
if ((global.elizaPres) && (elizaPres.length)) { | |
var a=new Array(); | |
for (var i=0; i<elizaPres.length; i+=2) { | |
a.push(elizaPres[i]); | |
ElizaBot.prototype.pres[elizaPres[i]]=elizaPres[i+1]; | |
} | |
ElizaBot.prototype.preExp = new RegExp('\\b('+a.join('|')+')\\b'); | |
} | |
else { | |
// default (should not match) | |
ElizaBot.prototype.preExp = /####/; | |
ElizaBot.prototype.pres['####']='####'; | |
} | |
if ((global.elizaPosts) && (elizaPosts.length)) { | |
var a=new Array(); | |
for (var i=0; i<elizaPosts.length; i+=2) { | |
a.push(elizaPosts[i]); | |
ElizaBot.prototype.posts[elizaPosts[i]]=elizaPosts[i+1]; | |
} | |
ElizaBot.prototype.postExp = new RegExp('\\b('+a.join('|')+')\\b'); | |
} | |
else { | |
// default (should not match) | |
ElizaBot.prototype.postExp = /####/; | |
ElizaBot.prototype.posts['####']='####'; | |
} | |
// check for elizaQuits and install default if missing | |
if ((!global.elizaQuits) || (typeof elizaQuits.length == 'undefined')) { | |
elizaQuits=[]; | |
} | |
// done | |
ElizaBot.prototype._dataParsed=true; | |
} | |
ElizaBot.prototype._sortKeywords = function(a,b) { | |
// sort by rank | |
if (a[1]>b[1]) return -1 | |
else if (a[1]<b[1]) return 1 | |
// or original index | |
else if (a[3]>b[3]) return 1 | |
else if (a[3]<b[3]) return -1 | |
else return 0; | |
} | |
ElizaBot.prototype.transform = function(text) { | |
var rpl=''; | |
this.quit=false; | |
// unify text string | |
text=text.toLowerCase(); | |
text=text.replace(/@#\$%\^&\*\(\)_\+=~`\{\[\}\]\|:;<>\/\\\t/g, ' '); | |
text=text.replace(/\s+-+\s+/g, '.'); | |
text=text.replace(/\s*[,\.\?!;]+\s*/g, '.'); | |
text=text.replace(/\s*\bbut\b\s*/g, '.'); | |
text=text.replace(/\s{2,}/g, ' '); | |
// split text in part sentences and loop through them | |
var parts=text.split('.'); | |
for (var i=0; i<parts.length; i++) { | |
var part=parts[i]; | |
if (part!='') { | |
// check for quit expression | |
for (var q=0; q<elizaQuits.length; q++) { | |
if (elizaQuits[q]==part) { | |
this.quit=true; | |
return this.getFinal(); | |
} | |
} | |
// preprocess (v.1.1: work around lambda function) | |
var m=this.preExp.exec(part); | |
if (m) { | |
var lp=''; | |
var rp=part; | |
while (m) { | |
lp+=rp.substring(0,m.index)+this.pres[m[1]]; | |
rp=rp.substring(m.index+m[0].length); | |
m=this.preExp.exec(rp); | |
} | |
part=lp+rp; | |
} | |
this.sentence=part; | |
// loop trough keywords | |
for (var k=0; k<elizaKeywords.length; k++) { | |
if (part.search(new RegExp('\\b'+elizaKeywords[k][0]+'\\b', 'i'))>=0) { | |
rpl = this._execRule(k); | |
} | |
if (rpl!='') return rpl; | |
} | |
} | |
} | |
// nothing matched try mem | |
rpl=this._memGet(); | |
// if nothing in mem, so try xnone | |
if (rpl=='') { | |
this.sentence=' '; | |
var k=this._getRuleIndexByKey('xnone'); | |
if (k>=0) rpl=this._execRule(k); | |
} | |
// return reply or default string | |
return (rpl!='')? rpl : 'I am at a loss for words.'; | |
} | |
ElizaBot.prototype._execRule = function(k) { | |
var rule=elizaKeywords[k]; | |
var decomps=rule[2]; | |
var paramre=/\(([0-9]+)\)/; | |
for (var i=0; i<decomps.length; i++) { | |
var m=this.sentence.match(decomps[i][0]); | |
if (m!=null) { | |
var reasmbs=decomps[i][1]; | |
var memflag=decomps[i][2]; | |
var ri= (this.noRandom)? 0 : Math.floor(Math.random()*reasmbs.length); | |
if (((this.noRandom) && (this.lastchoice[k][i]>ri)) || (this.lastchoice[k][i]==ri)) { | |
ri= ++this.lastchoice[k][i]; | |
if (ri>=reasmbs.length) { | |
ri=0; | |
this.lastchoice[k][i]=-1; | |
} | |
} | |
else { | |
this.lastchoice[k][i]=ri; | |
} | |
var rpl=reasmbs[ri]; | |
if (this.debug) alert('match:\nkey: '+elizaKeywords[k][0]+ | |
'\nrank: '+elizaKeywords[k][1]+ | |
'\ndecomp: '+decomps[i][0]+ | |
'\nreasmb: '+rpl+ | |
'\nmemflag: '+memflag); | |
if (rpl.search('^goto ', 'i')==0) { | |
ki=this._getRuleIndexByKey(rpl.substring(5)); | |
if (ki>=0) return this._execRule(ki); | |
} | |
// substitute positional params (v.1.1: work around lambda function) | |
var m1=paramre.exec(rpl); | |
if (m1) { | |
var lp=''; | |
var rp=rpl; | |
while (m1) { | |
var param = m[parseInt(m1[1])]; | |
// postprocess param | |
var m2=this.postExp.exec(param); | |
if (m2) { | |
var lp2=''; | |
var rp2=param; | |
while (m2) { | |
lp2+=rp2.substring(0,m2.index)+this.posts[m2[1]]; | |
rp2=rp2.substring(m2.index+m2[0].length); | |
m2=this.postExp.exec(rp2); | |
} | |
param=lp2+rp2; | |
} | |
lp+=rp.substring(0,m1.index)+param; | |
rp=rp.substring(m1.index+m1[0].length); | |
m1=paramre.exec(rp); | |
} | |
rpl=lp+rp; | |
} | |
rpl=this._postTransform(rpl); | |
if (memflag) this._memSave(rpl) | |
else return rpl; | |
} | |
} | |
return ''; | |
} | |
ElizaBot.prototype._postTransform = function(s) { | |
// final cleanings | |
s=s.replace(/\s{2,}/g, ' '); | |
s=s.replace(/\s+\./g, '.'); | |
if ((this.global.elizaPostTransforms) && (elizaPostTransforms.length)) { | |
for (var i=0; i<elizaPostTransforms.length; i+=2) { | |
s=s.replace(elizaPostTransforms[i], elizaPostTransforms[i+1]); | |
elizaPostTransforms[i].lastIndex=0; | |
} | |
} | |
// capitalize first char (v.1.1: work around lambda function) | |
if (this.capitalizeFirstLetter) { | |
var re=/^([a-z])/; | |
var m=re.exec(s); | |
if (m) s=m[0].toUpperCase()+s.substring(1); | |
} | |
return s; | |
} | |
ElizaBot.prototype._getRuleIndexByKey = function(key) { | |
for (var k=0; k<elizaKeywords.length; k++) { | |
if (elizaKeywords[k][0]==key) return k; | |
} | |
return -1; | |
} | |
ElizaBot.prototype._memSave = function(t) { | |
this.mem.push(t); | |
if (this.mem.length>this.memSize) this.mem.shift(); | |
} | |
ElizaBot.prototype._memGet = function() { | |
if (this.mem.length) { | |
if (this.noRandom) return this.mem.shift(); | |
else { | |
var n=Math.floor(Math.random()*this.mem.length); | |
var rpl=this.mem[n]; | |
for (var i=n+1; i<this.mem.length; i++) this.mem[i-1]=this.mem[i]; | |
this.mem.length--; | |
return rpl; | |
} | |
} | |
else return ''; | |
} | |
ElizaBot.prototype.getFinal = function() { | |
if (!ElizaBot.prototype.global.elizaFinals) return ''; | |
return elizaFinals[Math.floor(Math.random()*elizaFinals.length)]; | |
} | |
ElizaBot.prototype.getInitial = function() { | |
if (!ElizaBot.prototype.global.elizaInitials) return ''; | |
return elizaInitials[Math.floor(Math.random()*elizaInitials.length)]; | |
} | |
// fix array.prototype methods (push, shift) if not implemented (MSIE fix) | |
if (typeof Array.prototype.push == 'undefined') { | |
Array.prototype.push=function(v) { return this[this.length]=v; }; | |
} | |
if (typeof Array.prototype.shift == 'undefined') { | |
Array.prototype.shift=function() { | |
if (this.length==0) return null; | |
var e0=this[0]; | |
for (var i=1; i<this.length; i++) this[i-1]=this[i]; | |
this.length--; | |
return e0; | |
}; | |
} | |
// eof |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment