From 5a562d12938da08b53e5b0e69b34ecc5b6baa573 Mon Sep 17 00:00:00 2001
From: Sweta Vooda <sweta.vooda@gmail.com>
Date: Thu, 25 Jan 2024 20:15:12 -0500
Subject: [PATCH] added open-ai integration

---
 .gitignore                       |   6 +
 README.md                        |  51 ++++-
 langcache/__init__.py            |   0
 langcache/adapter/openai.py      |  24 ++
 langcache/core.py                |   7 +-
 langcache/evadb_data/evadb.db    | Bin 0 -> 135168 bytes
 langcache/statistics/__init__.py |   0
 requirements.txt                 | 131 +++++++++++
 setup.py                         |  27 +++
 test/open-ai-integration.ipynb   | 379 +++++++++++++++++++++++++++++++
 10 files changed, 621 insertions(+), 4 deletions(-)
 create mode 100644 langcache/__init__.py
 create mode 100644 langcache/adapter/openai.py
 create mode 100644 langcache/evadb_data/evadb.db
 create mode 100644 langcache/statistics/__init__.py
 create mode 100644 requirements.txt
 create mode 100644 setup.py
 create mode 100644 test/open-ai-integration.ipynb

diff --git a/.gitignore b/.gitignore
index 68bc17f..e7449a9 100644
--- a/.gitignore
+++ b/.gitignore
@@ -25,6 +25,11 @@ share/python-wheels/
 .installed.cfg
 *.egg
 MANIFEST
+langcache-venv/*
+langcache/.DS_Store
+test/.DS_Store
+.DS_Store
+.vscode/*
 
 # PyInstaller
 #  Usually these files are written by a python script from a template
@@ -50,6 +55,7 @@ coverage.xml
 .hypothesis/
 .pytest_cache/
 cover/
+test/evadb_data/*
 
 # Translations
 *.mo
diff --git a/README.md b/README.md
index cb1ab55..895b477 100644
--- a/README.md
+++ b/README.md
@@ -1 +1,50 @@
-# langcache
\ No newline at end of file
+# langcache
+LangCache is a semantic caching library developed for Large Language Model (LLM) queries. Its primary purpose is to address the cost concerns associated with LLM API calls and to improve the speed of LLM applications. 
+
+### Installation of langcache for developer setup
+To install langcache, we recommend using the pip package manager.
+
+1. Create a new virtual environment called langcache-venv.
+```python -m venv langcache-venv```
+
+2. Now, activate the virtual environment:
+```source langcache-venv/bin/activate```
+
+3. Install the dependencies
+```pip install .```
+
+### OpenAI ChatGPT 3.5 ChatCompletion API usage with langcache enabled
+
+Before running the example, check that the `OPENAI_API_KEY` environment variable is set by running `echo $OPENAI_API_KEY`.
+If it is not already set, it can be set by using `export OPENAI_API_KEY=YOUR_API_KEY` on Unix/Linux/MacOS systems or `set OPENAI_API_KEY=YOUR_API_KEY` on Windows systems.
+
+#### OpenAI API original usage
+```
+import openai
+client = openai.OpenAI()
+question = "What is ChatGPT?"
+completion = client.chat.completions.create(
+   model="gpt-3.5-turbo",
+   messages=[
+     {"role": "system", "content":"You are a helpful assistant to answer all my questions within 15 words limit"},
+     {"role": "user", "content": question}
+   ]
+ )
+```
+#### OpenAI API + LangCache (semantic similarity cache)
+```
+from langcache.adapter.openai import OpenAI
+from langcache.core import Cache
+
+cache = Cache(tune_frequency=5, tune_policy="recall")
+client = OpenAI(cache)
+
+question = "What is ChatGPT?"
+completion = client.chat.completions.create(
+   model="gpt-3.5-turbo",
+   messages=[
+     {"role": "system", "content":"You are a helpful assistant to answer all my questions within 15 words limit"},
+     {"role": "user", "content": question}
+   ]
+ )
+```
diff --git a/langcache/__init__.py b/langcache/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/langcache/adapter/openai.py b/langcache/adapter/openai.py
new file mode 100644
index 0000000..025792e
--- /dev/null
+++ b/langcache/adapter/openai.py
@@ -0,0 +1,24 @@
+import openai
+from ..core import Cache
+
+class LangCacheCompletions(openai.resources.chat.completions.Completions):
+    # TODO: Add remaining args
+    def create(self, messages, model):
+        # Get the last message with role "user"
+        last_user_message = [message for message in messages if message["role"] == "user"][-1]["content"]
+        cached_value = self._client.cache.get(last_user_message)
+
+        if cached_value is None:
+            llm_output = openai.resources.chat.completions.Completions.create(self, messages=messages, model=model).choices[0].message.content
+            self._client.cache.put(last_user_message, llm_output)
+            return llm_output
+        else:
+            return cached_value
+
+
+class OpenAI(openai.OpenAI):
+    # TODO: Add remaining args
+    def __init__(self, cache):
+        super(OpenAI, self).__init__()
+        self.cache = cache
+        self.chat.completions = LangCacheCompletions(self)
diff --git a/langcache/core.py b/langcache/core.py
index 35b7621..7107ffe 100644
--- a/langcache/core.py
+++ b/langcache/core.py
@@ -1,6 +1,6 @@
 import os
 import evadb
-import openai
+from openai import OpenAI
 import string
 import random
 import multiprocessing as mp
@@ -17,6 +17,7 @@
 class Cache:
     def __init__(self, name=None, tune_frequency=5, tune_policy="precision"):
         self.cursor = evadb.connect().cursor()
+        self.client = OpenAI()
 
         # Setup needed functions.
         self.cursor.query(
@@ -72,7 +73,7 @@ def _evaluate_and_tune(self, key: str, ret_key: str, distance: float, **kwargs):
             # LLM tuning.
             self.llm_msg[1]["content"] = f""" "{ret_key}" , "{key}" """
             response = (
-                openai.ChatCompletion.create(
+                self.client.chat.completions.create(
                     model="gpt-3.5-turbo",
                     messages=self.llm_msg,
                 )
@@ -165,4 +166,4 @@ def put(self, key: str, value: str):
                 f"""
                 INSERT INTO {self.cache_name} (key, value) VALUES ("{key}", "{value}")
             """
-            ).df()
+            ).df()
\ No newline at end of file
diff --git a/langcache/evadb_data/evadb.db b/langcache/evadb_data/evadb.db
new file mode 100644
index 0000000000000000000000000000000000000000..a35eb7ed5c83034045bafc11b344da19eb3d07d2
GIT binary patch
literal 135168
zcmeI531A!5nSeDqJ+`EY?bxzoLS&l|i#Ul6%d%ok62(@6i7h8SLXsAyV`*e7u_Z-E
z5{J-W#|b1GpcK;r%~Fn~T!pewwtzL+blZkNTe^k9(gH0<p=AkeflbSXYu_84BiRWM
zb7g-ewl)8I^S}Rn|2zK~jk?#g`=gxR7Yq-vQN2YnLqZUeWqQ3tB56ZE)#xYnDn)PP
zsRQ(v$a+83+cwF<@Qn(bnR*xJsifZ3?pB92twrn9Ch~AmHF<$*A6cPzUDYA)QCus1
zOs*psqJpTHO5tZEca<x3>n()DAMkS9BAW*hB!-PegTgVhG1$ip_#@F^c$o39QFbuc
z&zL3=>P81<s&qCRF&2!neS@4Y7Vt#<!2sh4Mxv=RCl!{pbh(^8E`5)4dAmzLX%>B5
zA(>9_d-ZMZ9@k1&SG~TF46s9-eyy{s<y>c1oypu}z(QQ6enoqyvj-nB;ow##bC%xS
z*`s&&wzuQ7)m?2J&aU<PRj&2=x@1N{#fr`@SKCTAPN>T&+Mw@pt#Ea@+%2x|EL#&`
zG8*)qZhfn(-G!>v;_Pm5wz_a(**dY^CsCHjlBcQAFnV5zN@p+-W1TsuS<gTgczjek
z1zenlsZNS7tG?N&J@_Oh#6}0wz|Gc1ffgI?kEDerqq#wlej@O_?zT0(E`1%gtUiO-
z@BLKVQfO!{Rq8qoQ#JoIibUm2;^Ud4&KWA*(xt>$vDgzsT$J^qMv>R>a}$au_fKv%
z?5dhg+;B}6WTOCN3p*Ig>HsP9X*)CR{u6hFlt%;urrRZjhBd`X9k=wP4#-8qWPFjE
zR5HqF6CGq&aEm867#l((QKFZMk0_A?#A*2*#F&5{9S&uf+XO%OBTOJRIEaTn{qoMv
zc9+wQfwSQ-JIsjkCx)m*g4aL91tMse%<etOGO((wVe6FLm*`Le5TrJ*H>DG@N4SJA
z2`)3dp<Y9ssMm-wGA8lyj9o=)mCj@$b~^?AskZ75rd*US(TLoXpZ>YJ3i;k22*sk=
zj!&65{T|HHoae;sv}`}7<&(IwMWfW6Z#r53%Qz>~@iH=Pf00Tzzm^!$BvuUpZd;TI
z#{!58T2$cWLb70W(vNNKR@XW`BhH6s&8)m=4!~+6Xx8z@201TQXc%2bs&uur#MoA$
z?PO)odRr)JEm;XuHj~XUF6`&hy->79h(y_Nl!>CQs&7RLm7cZ^VK(OiUM3n5iNain
zW230jQ7()I=IqInMXRALqM;$baw1)xFj9pojn=B!rN%;NUdb1q@>FXmG*}Cjy0+S>
z8bTJu!~!ts(V~&HDwS@*0%DXAJc6gaJ~qOoJf3@8Ao5La>XZ)R0{#9#X3#YyN8%70
zW{1*ltDC;12ja1`K&k6qFcptn%NbLygdFKq2utEoS|H;I27LbhSeQ+$i&L}FBtoT#
z(WK{LP#<eWa7ryiC<!5HQz~^A*rq}<siAoEpQMVak%&yCn>UZxHCKQm{7SVM(Sck9
zLzFaSYw`Kf+!+fG<}H`}UM>*z`}|xOZA|d0ATLLv0MU$XHVXsoDG?MF^MwYxT&e4r
zHx)op<rtIbP%#oEgnqWGN|5Ic>AA;J5w_gad~(UHlYb~Q$O!mE3;op2O2j24L<6*E
zQzSN&W@$A|AF-v<6ZOK}dSxc3R9liI_R$p@4SGY8+a=T@?FP*?>gUy!Md8AS3w1~Y
zFCYK}fB+Bx0zd!=0D);GFfxl&%^&HNbV$0<>YEFAxD{w`8w+!bdLvvovM90@g-f>t
zgI;#g)?j#3B*c2SMT2ahzXeB}g?B>uHS68Ng;@uwMIh3Y)X(@51uP5=dpWDcYw2t9
zdN@;~hclb(oY&W2v$34f?(=#rBl-fBZX||`Yh?!qU7y&b1zWhlmPLd9zD1$o=s+-F
zS!gmXilB=r3s7}7vHe_R5x0f)_ASa->qP}}$izllBj@$nJPkIV*KBXJHQCJ;ua`4g
z8?08=*JK{Cs#Nnwi!eW7>EG)2`C>R~_*oi@q98aR=}nc5?6&yqW~<%oVNIOZ=(GFm
z_&wWbH#M5gtjTO1IZLUk8W~1*w+yh+m8*L`OM5-2$o^0inc2izn;NZ64P2kq;xSqp
zZC;KuvJH(kJ8A*8#)c86LRCFV%}03sL;gWF?2itAmX-#*LNFLLmQ?A;Xm>)mB6%6j
zX0=&OM!VT&YhW#QZy#rFY%-cXsBtvnCT$zB%2j2fGE|3_a4__FSnomQ=G$%Z`K(r>
zsnKGz*nNFA)@<`NSdD#_#s=1C_L=)emdg<PVq~`yN6K4*u|V|mus#uv_u%65E8%Sv
zs9WuvvCnJqu#J5UrY4W4(b8b*v-eqzBVAIJeYDEZAz8sjqFpU+cW2*5&J%6rqUd)p
z{8?7Whb#zt0s$r{n80|GHlSLy46>03ihZEK9U43O`m7CRv)RJ-aaN<vZf@)|`z&_O
z(`fTqj3$$P#7(HIqdHWnjsUv;+ct!Tu#^VwGp*7PE}!vZ0~k-T4qP~|LUuFDdMzfe
zk3%)!>>iKFWA)f9T$9maGFn+vA)3=jYCu9Aq^_qPpmtEdr2b3|P~W5WOzUI^%76e6
z00KY&2mk>f00e*l5C8%|00{iQAW$lsPvpdTNm8aGgz##CkSdO1s)}S)L^49C)XJ)f
zOc+j4AS)wqL`#n4nGlg|mds8}9&C~7WL9#rkOjW}FV%h^p~lcJcmV+*00e*l5C8%|
z00;m9AOHk_01!AW35>|3D$9sdGGD?C^`X0s{DJ<BzAzUEv3~#dPke*IqJ{=@LlbMV
znvEtSx^KzmMfVh-8zjtTTc5GXXSH|tboI9M^me&g8T2V8=XOF>Ef_H!W!o(_*2;Pt
zn#^{O-Qu--8c~TR6Nl`v*;&q(Q#QW-FQtAbp?*ibby~U@Dg^|901yBIKmZ5;0U!Vb
zfB+Bx0zlxjCZLm9h)JRvQjM&d%mf<n_5WFFy@Yy+dYrnCTB|*-y-I7>Jgphluo}0<
zteLIRsE@0Us-IRLQQxP&UcE;hRkP~z)D7q)cmV+*00e*l5C8%|00;m9AaGg{D48Xn
zTP*2lYhT;j&GdAxa=B}2W>(4#X<6%X#_jBI)zp+#$mge}tDW85=XZ9s*3=a1<h5yW
zZ?~(fre;RDygDQ5YOAR!DZ{0#Zgaa@I^8bD<z8D;Q$AC^AWP<4-NvBDPNULGap|3_
zU2bO^la{JW<fS?Z`mnr@9gJ`@i*cSv(6fn4Jfkugi#8h7GvsAul29-lZ9*S^E~eyV
zb0h=kq1ZLXg~GoYtyW%DD(Mf!(DO+nUol=#s*xKg;kb{DdIp$?e>-QIrIs6JOA>-1
zZb%SXjEPrq5!N{r^l~*}ZjeI{e5@%il-E{C*idLN`4RIP;ei)5Um+E9M&=252hsB*
z!Zn}#a<ib2!4Fzogo_@G)UXALxg!fCsfTJzpZ=7_NX=T6qH3gC5*-RnpLV3IreCR;
zKVp$YEQ~j}H82=tz0;>ZOKGHLg915Vt|ajY>uGa<psr?vT+p3(?CZ4Y7Sz?ulF6;b
z$n3;Z=hKhZjD`KEA4zdP!m<b#jR@ds&LHIWVo9Qn_yg#HCFps~!m~E9T{Zan|19l#
ziFTv*V(ohEO=$Q3wD!l^d#N>)mAa9NQ%_N^QbDSQDyKBmJ=D1rOUbpbQTw%TQkR@o
z107Tb2mk>f00e*l5C8%|00;m9AOHkD8G#wHxkPr@XjX~LkP;+gMwR$u@5wx=fKde{
zt4+ypv`B|P;-1XY+tpT%)n><u%4W(IWCY1@&`eyGI6_pal9duDJXC^{#DSq={Be35
z6`FzH;D8W?KYO1H18MOI_<be>q`@L_07#8b#le>%Y=2g?r%)rCBP0kx9uk|MilN}`
zc>yjd8ADNF99ba>oUX*Dr$ZD9e3T9<$SY)4l$IX{kl|9Yg8<S>nVp<G0)Vgoqc8n~
z7Z3mfKmZ5;0U!VbfB+Bx0zd!=00AIy8WX_R|6%`s8ao)O1_Xcr5C8%|00;m9AOHk_
z01yBIKmZYd>;KRUfB+Bx0zd!=00AHX1b_e#00KY&2%P=|;QIgR?_;PT5C8%|00;m9
zAOHk_01yBIKmZ5;0oeaT8vp`800;m9AOHk_01yBIKmZ5;0U&Vt6TtWX&nh}Dp`M`*
zQCCo#sO40Z_J6d$)lO*lYQLsETk}`VgPQ%CK~0CIUPG$?r2eV;YIR7xRDBjY30^<|
z2mk>f00e*l5C8%|00?|Z2-M9YXIB+e%`PA$K8}sX!d%4N>g?)ru3ypK>FlwX>rC}}
zOH+e^tgIx<stQUek`TUHESamjr^`exst}aSM@rE7p<p1w<tT9n16;j6@!Mi3sMe8{
zNLLlo6$%H3LeY%2Iw6yxU{U$U)2XU1JDE<EekRsgT9$7oss^g4L0MgTG9}76C1e#=
zf^7E$15qxJZ9LX7yO`7^Gi;7=;o+>h;p8)Ckh689qzW0~^`kFh3wSsIb)CgrueTW#
z=TM}*jFeO&{VNh4VO-myVb&83h8Z_I#Pzt=_0*Y+#(IOoswEdxk-GUfZx|&p&M<nq
zJ+mBr@msRg-ZpnnQ=KKn9>YbaX(m0bGsFc>bXt>|wBXW^<t^c0D8zZ0tWr;KrhHxz
z!b(=nL3Z}_1-Iq3u|&gYFvyLCWNm(hPNez_lAKdTN{W$Do48@d6O09-sLrmHuC6+R
ztg?VaE|nCcg1b33jJ~~b6*ug3uSZF9Rk)}soYWQw#i9vz$)Zq}p7pC;IGa*19lI;y
z3Fdc?M01tSQzUALvYoJo(rP)*Sc>%xvVG`l8j~gB7MRp!lzmJH(sC)OLv5z4fJ`VA
znuxjHa5jPZELl}clG%MWRXNlu%uV>mkof*TPC~8JzDNCz3Q(1lk-CZc28sr-+9#=h
zXrtOUv>bH_b(H$0_OSL&?G@S=wLj8+N4t}{|4TB^ftf%62mk>f00e*l5C8%|00;m9
zAn;ic(8^~ML@LNc&MK6b5yJP=k(EM9Dsog%p_W$?L?SL!pcAF3%Cpi`Wui3Y%&atJ
zsYYH!5Xk_IvZP3^BM2cHqbwHAN`+n&GtQ9P31ad{i-IbbFF=Vop%sNTPmDt+3QeWl
zLJ*ULM&xS2v_xP)UQ{fv6)BY$Qt~+jkq%$T$Qkl#g2)6cWCg-0Sz!v9O3;{yNJy1g
z>ZJ<dAQ4-T%5%$-$_nK=k`R)m1@bbI#9tAJum3Bl^Ci@))Z^3-sq4^A|NPIYSwJ~J
z00;m9AOHk_01yBIKmZ5;0U!VbzT^bvDGP*~Yfg4=jZ~+=ccn<GgnJlL_jjNhJfxNK
z0(7&9q?nK};ow%r?@iy@Agz!U;A{Tq-iIyhU@U!C2s*1=if>QBDJZ0nrLBTUC?oTf
z;p_iO>LCgBKhzV{L)7ck5$c66IeRc42mk>f00e*l5C8%|00;m9AOHk_!0AIkxR)Vy
zPlZ%T%1ed&2&4+(_J?H5Kq?om`3qqJS%JKi#J3tqi{w=#naly-|9AQ{38)DW00KY&
z2mk>f00e*l5C8%|00;nqsR+RH|ED4Yav%T%fB+Bx0zd!=00AHX1b_e#00O5E0l5Bu
z`uGxR0tA2n5C8%|00;m9AOHk_01yBIKwv5YaQ%NOG9U*6KmZ5;0U!VbfB+Bx0zd!=
z00AIy`Vhd^{|V|v3HlE&AOHk_01yBIKmZ5;0U!VbfB+Bx0zlx)N?<mjAm*ziWH%Rx
zasdyQ{Jz7bd)p#2P@UlZ|1Ya!!EPV`1b_e#00KY&2mk>f00e*l5C8%nodDeb|It}N
zP9OjTfB+Bx0zd!=00AHX1b_e#00LiD0vhTaiAJ?gqCG_YNOPrjw>qq8En25Gk%x<_
z$qQ8b$O^^lst$RN;#%oravi}C6-33CwXPq>ZdbWdx86cX`~fewEwXvgALSS}77Yr=
z%*J3JGvJRzgW+Mu!$#S`U_WD;M5r4bn5oj)Y{XbF%JvO%zF5E$^#=otCm4yQ&YV<O
z*3#v2_PF#t&gJbc{iIp+b%kU)!SB_#xqDnIU0wD1LNdS(ar(8+u9kD1U3DgNlK~5H
znfev&oz5P7l>Gk3)LD9WXOG_9+un}TR(G{^IJ?&CSGm^f>yjA-6)QTsTx~1eIH4}9
zXoJ4XwZhfqa<{m;vusU($!O4by7jHDb{DEvi?h4M+3LcDW$VOtpF~+AOP;1e!{~V>
zDxJYVjCJOqW<3L0;PFxE6mW4GraCFUtoo*)Ve>usBqqd02hzaJ)<%IA8}5&!g(jo9
zL6CkT@V)M~HN7r<9k#4KgV^u=RNPW%px%*1It^1b|1^q3<xS$_nWN4bD&5kh#8|P|
z6GL2-^`b_R*YI-_iYNC^ZZ_<y8uW#xHCd320ubQ~PqU;+^l3ZAz2%fVA{a2;F2N2U
z-r|;?)B(9jn2axSlS)PzZK8t=3vTfQ2V+BMBueyB@ew6*fH*C`gBTOgqr;)hpkovK
z;EynY*x(=@`t-{?JKJ4OH|{fRILr<+qWp;=Dv{vz4{?DA8YZ)QPqGZGikU|DB|4M<
z1gXvIP3eT}5iTK2g3AnVg@$HIshhgjh%quI@$rmZMQWAKWFmGu1^ubE>JO$|lrPbU
z+?1dGxw;DZ-X93XqS=m5nK=C(%+j3a#O$<eKc?lAxUxl~)SYiSS^vv8C)4pVGHrj6
zN;kij7||qF4FPUjlnKWIhznX&;N?QHV0F@uZSGdrIz1!KhiA>Kyl4)<Y9eUX@x}%@
zFIH$6T}P^PwY9|9R-x@=WzTwBC~7TP2~#$c%`q<Q=hD4Uv_^<T*>IGJqOPiMMGKXl
zwhm!7=K@|P8WD-YT!>?%sM1j`j0WcH$&*E^p)I1JA-{4WU7j#fg(}TPMdDZp%`5rh
zQySQXg+`&lTBy{u)lStAvM44NfJu)QjjUCvbPE;`qm1AYJni+d5iaHN+~Wd~Z*o(o
zbPyNl_XjeAt|>VZhuAPXly+O)^esIMg@&aCN?rGYsd(gC&X{r~<VdGNSQ3xY0vS&*
z;Pdy#!faw)oSKa$5h_KDCOr>>`dBN1Q)(eXNeD@sQmMPZHWiXd4aKAXBvn+6L}V)6
zym`c~xdI&FSE|j34&)*jqNFKXi_eed&RBRbYhjd_RsCLcbGYB<=fY@Xf>#B3IT8hk
zW^A)r7-&z4V6u<d<w{-0yr}?+D#w^ahl-IXA@s9dRf0TsNY6c%im>IT=95cqo%}<g
zK}NtQTIi>CRw6DbAsV1Pn<BBHG)t>#`iL!+o~Re*)+;kPrP`7V?S%{QepsV=LsCqP
zNwha;S<P(qV?`GiEhC>QaHx(c%T<@jHz*#E9+c0K8c`N_eM$sI3}>oz77H<wSeSD|
zeVo_p5A<*Jg}Fe8_4~I^BB~a(<ViAQ#=;)gI$_K2Lvv>=jOO#@?VZc<I{ahz-9p1i
z(QK8jx|$fl6WSn`F){N_FS0C4o*tZ21|_y>siRL|&FF<y!f-iukzh??nU$P^MF(e!
zY!W5qclzWk8ez9^AGOn`A}qp|O1wQub;i^<fWapW@N&Lv;m58&)|4F>$Xoa(cNl12
zlfCQ}?>jR4m;CTdp}~H}iAH7-N5&*NoHM$vQl;zYAjWD1-+0j~5UmZ9g|p~w3Je;P
z@M88P>1T*Mc(UBsskp4%jfS|)oYWM{<canA91|zoASUyEB*55T+0m{^)MxuiY-`3(
zg$8DpQWxo%YQ8)f8?+`n3G3OTL7hssW(_gcmhHQ=K~s9~1UY6+=D!o<7d)6w7k8<A
zaM_!Rv>UU|{%F3;Izi;nv^;O4IBhQVR48>@*PO(qX*=>Akap?`@>HSuOPKVhDY(6>
zyiAz4c6TS{g8ZO3-X7(|$;(CUV3G{j@mMT&IhNqnVrsxdo0`PhmD|R7V#3~GsvT)M
zgRnQv-LQU!JIX|@>h+VEoHuqSGK-oa7Ui|T$wqCs>d>DVF7pB9c3NQ<GR4R%T-!;+
z-3|GgP{^<JL?OR)XPhEX4wo#Z>q=6gVNJ18H{B6)xR4=Qu%w%F&WbWE&l{aiF(wX|
zEW*L9sbyzsU4w_Kdc82^rjoK(mFa}+5iKE{#69r&|4(UC4{Ct`5C8%|00;m9AOHk_
z01yBIKmZ7Qfe66o|Gz-a08@Yf5C8%|00;m9AOHk_01yBIKmZ7QN(A8g|EB~N)B*t@
z00e*l5C8%|00;m9AOHk_01)^B5rFIeUm$0IDL?=S00AHX1b_e#00KY&2mk>f00cfI
z0&xBRQvwTWfdCKy0zd!=00AHX1b_e#00KY&2z-GE!1ezxkTbv(AOHk_01yBIKmZ5;
z0U!VbfB+Bx0-q8AeEnZW-6)}6pbnuw@B#ur00;m9AOHk_01yBIKmZ5;0U!VbJ_iD4
z%H(qmk~Td%q>m18`c2$$`n~Y&>1Rq$l1`jB9q<1Ma+3u8hZhh40zd!=00AHX1c1Qw
z61cpCP|UqvD_YE5qPS*@GEvO_l0a-IG`!Fg408+7TQ2PPjPEaEeBt0wU(Dy@!sAzu
z*L_Qp%x?L|R^B}R%*2Mr7xO(OAH;w9mv+8f_wdBV_qWl?yZarDuN-*T_u7W$n}_D{
zFWj%^M=yG9;-P0(#bsUB(N**Bo;b|BxA@Yl_Bw{=s}2U5OnmFJU*TOtQitK6E{K2g
z<!yZH-|y#n(`x?7qi;KYcI<q5ynZoVN|(l$YHp1iFP};8x%*oB7p4)%T_5g^JIz(}
zt~=(?+kbsAzvtc`)5jDwbj<yT<M(e%_^!E!CVH=Z))7AT8^`0@#vKlWmA~V!6n|}t
ziyuAoW<2n!lYjon$LO{h8~GK_&7^zI*U%5$ML3Rf?exw|n&?{wcGAHcn&SWQ*QJj5
z|Nd%mblI)(m$q4G3v<A+VPcrx{WDwKt?}?5INyz5s9i~qtTNJ9&QtRj)&Bm$EB^JL
z`Ck|GE)JK~$DjFGEx+RRtN2;f57Dx7?x)Slh~qCi5AYSf8{@BE_SK0GcmE=O_2T0W
z>OB?xpZ_kWw-oG&mmSg4v5R&5Eyv~bkDq%WuKjQgZR@<>@&3Acx?S;m$4|bumY;Lx
z9)8Z)8}v7|w@&=Q<&VE|$CdHThdI9ekK=URpAS1Wx0Tbscx^M?<~GG+4_wNhzke}*
z&ypbh^?QpQzj)#hef*wX@fR-odGm*_$sRuQl6iE=npf!6s)dd}9J<%>-PW`C7n=6+
z$LgPS+_3LD{`No4;V(T@#;=sWx!3;vv-z(XBJ{zhuA|@ByMcf6(IVch8K<utf7M~R
zhmMy#_%N^fx3hWq_J83on6byP<B98d_q%)Ii|)|VUGMzs;umYLYL*>)l)m!4UcO?L
zFTV4fEfc}6`y4-g*h@Emvuxs<ie~=ol4J1~SN1sGE_fi$?b}Ot6gSe58aF?9;olrj
z-1-y#z@>8j%@zCNk=PUbirT-$XDm3g`S$Oe%b!<B@(pY6<G)(=LHvMkKi~WCcNXtB
z_cnh0v+HSF@eTA@j_vV|x4ZdO6C|xJ_wrA__FVkdN1tnc|NQFs-~Q%_7oA(dU$yNT
z$KJWGHvhwPr1_$`PdN?+X~*HS1{}R}-fy1swdd)D&ZUkOoR&WK;1Wl}&EKAA_|;DO
zio0q4jko(Ic5plRyY>`2#<qTgj&H1WygKJB`t2WT_+`dN<F_x6@xSHnjW0h^=Xkne
zFU>7}uDPM)3CEG^zDuurN=Yk^-OL}f6+60*uXFso;XcQO%Q*f}r<Gn)(oe6QAmaC{
zj`Euie}g=7!x;Vbo9=YP-rwaoTCpVV8?K?}zI-eFzvM0PTW-5K-tf#^K6JwYdiQf%
z<GLZw#LL<r(QoyS^1r#|diu5vcQ!v_zL-AnjE=tgzrFnayN<=}&k_fps=Jz>pg-iF
z-2Tqui?6zW;^jZhq?hdcC%Ra<hhEe~@{bSQF(I41jDAs3Zm)Of58nOu;`mqg{Apr`
zK~BFibOHUmqOJLl=j`BPKUhTnl2p>)-Z3|R-+@0*G)fBSj{9r)_SNslUz&J?{;&4=
zbg1n+@oU~a>{$Eg1if|PmHgK)RmNZ1GtNK4-NLW=zHZ5dzqu^_NdHmC^`1VOd92bg
z{$L?rSKUhACfiHz_})$Q&U=FN@!Fs9cg#N0yyFLNHUD+x_52OTN8&#k4K?5Xhl9;O
znDqm`eEYw|H|(_0=iI0|c+QcZ@Ga+DMK9?t<G)ci!QXssfNtOGdFUU3oy~tbd`a9?
zP0&Y=?xQc>_H&10psrcs>UKmlMf{cDy1*f?*b}#}@8kcn>~4PBb#?T*>vrF#+_;<O
zs^%@Z^XPiV+BwU33pvh@QSZbzU9p5O+kaL3md?M&zc=J{jD2t!z4`B&_`ZiM^w*Z(
zGjaKABlHv3oK4?t{4Rfe_&WX%x7_47Ui>Y`ldJYSj_iCQ{+_<kv3N#X^9z@L+tK;&
zH#<siMQjHS(EDaz>A3vrr|E-Fzia==-rF4yzVv*&w(|G!N50?0GtbTBuay2J{zJZU
z;>BIX^cvM8&G!Fz)FHX|u8EHAU*#*v2k5amj)S+}`Cs%uzj7wMS95?q_G>G@o>1`b
zyxADP>UWp%wL4#S9KU#Z^DoP5Cw^N|yyW{|Uq)ZQ<SmDD&$W(c3^N~&9=(ko-u0{a
z<yt+j?pw)^?^g)(1^Vla4u?22IqaAE8piitcIkN6c-<=5e!?;CcDv8}5WR$7t0d9!
UzEwoWCB&Zb{Y1-n6y;m^e*!J_CIA2c

literal 0
HcmV?d00001

diff --git a/langcache/statistics/__init__.py b/langcache/statistics/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/requirements.txt b/requirements.txt
new file mode 100644
index 0000000..7864127
--- /dev/null
+++ b/requirements.txt
@@ -0,0 +1,131 @@
+aenum==3.1.15
+aiohttp==3.9.0
+aiosignal==1.3.1
+anyio==3.7.1
+appnope==0.1.3
+asttokens==2.4.1
+attrs==23.1.0
+backcall==0.2.0
+beautifulsoup4==4.12.2
+bs4==0.0.1
+certifi==2023.11.17
+cffi==1.16.0
+charset-normalizer==3.3.2
+click==8.1.7
+comm==0.2.0
+contourpy==1.2.0
+cryptography==41.0.5
+cycler==0.12.1
+dataclasses-json==0.6.2
+debugpy==1.8.0
+decorator==5.1.1
+diskcache==5.6.3
+distro==1.8.0
+evadb==0.3.9
+executing==2.0.1
+faiss-cpu==1.7.4
+fastjsonschema==2.19.0
+filelock==3.13.1
+fonttools==4.45.1
+frozenlist==1.4.0
+fsspec==2023.10.0
+gpt4all==2.0.2
+h11==0.14.0
+httpcore==1.0.2
+httpx==0.25.1
+huggingface-hub==0.19.4
+idna==3.4
+iniconfig==2.0.0
+ipykernel==6.26.0
+ipython==8.12.3
+ipywidgets==8.1.1
+jedi==0.19.1
+Jinja2==3.1.2
+joblib==1.3.2
+jsonpatch==1.33
+jsonpointer==2.4
+jsonschema==4.20.0
+jsonschema-specifications==2023.11.1
+jupyter_client==8.6.0
+jupyter_core==5.5.0
+jupyterlab-widgets==3.0.9
+kiwisolver==1.4.5
+langcache==0.0.1
+langchain==0.0.340
+langsmith==0.0.66
+lark==1.1.8
+MarkupSafe==2.1.3
+marshmallow==3.20.1
+matplotlib==3.8.2
+matplotlib-inline==0.1.6
+mpmath==1.3.0
+multidict==6.0.4
+mypy-extensions==1.0.0
+nbclient==0.6.8
+nbformat==5.9.2
+nbmake==1.4.6
+nest-asyncio==1.5.8
+networkx==3.2.1
+nltk==3.8.1
+numpy==1.26.2
+openai==1.3.5
+packaging==23.2
+pandas==2.1.3
+parso==0.8.3
+pdfminer.six==20221105
+pexpect==4.9.0
+pickleshare==0.7.5
+Pillow==10.1.0
+platformdirs==4.0.0
+pluggy==1.3.0
+prompt-toolkit==3.0.41
+protobuf==4.25.1
+psutil==5.9.6
+ptyprocess==0.7.0
+pure-eval==0.2.2
+py==1.11.0
+pycparser==2.21
+pydantic==1.10.13
+Pygments==2.17.2
+PyMuPDF==1.22.5
+pyparsing==3.1.1
+pytest==7.4.3
+python-dateutil==2.8.2
+pytz==2023.3.post1
+PyYAML==6.0.1
+pyzmq==25.1.1
+rapidfuzz==3.5.2
+referencing==0.31.0
+regex==2023.10.3
+requests==2.31.0
+retry==0.9.2
+rpds-py==0.13.1
+safetensors==0.4.0
+scikit-learn==1.3.2
+scipy==1.11.4
+sentence-transformers==2.2.2
+sentencepiece==0.1.99
+six==1.16.0
+sniffio==1.3.0
+soupsieve==2.5
+SQLAlchemy==2.0.23
+SQLAlchemy-Utils==0.41.1
+stack-data==0.6.3
+sympy==1.12
+tenacity==8.2.3
+thefuzz==0.20.0
+threadpoolctl==3.2.0
+tokenizers==0.15.0
+torch==2.1.1
+torchvision==0.16.1
+tornado==6.3.3
+tqdm==4.66.1
+traitlets==5.13.0
+transformers==4.35.2
+typing-inspect==0.9.0
+typing_extensions==4.8.0
+tzdata==2023.3
+urllib3==2.1.0
+wcwidth==0.2.12
+widgetsnbextension==4.0.9
+yarl==1.9.3
diff --git a/setup.py b/setup.py
new file mode 100644
index 0000000..c89f095
--- /dev/null
+++ b/setup.py
@@ -0,0 +1,27 @@
+import setuptools
+
+with open("README.md", "r", encoding="utf-8") as fh:
+    long_description = fh.read()
+
+# Function to read the list of dependencies from requirements.txt
+def load_requirements(filename='requirements.txt'):
+    with open(filename, 'r') as file:
+        return file.read().splitlines()
+    
+setuptools.setup(
+    name="langcache",
+    version="0.0.1",
+    author="Georgia Tech Database Group",
+    author_email="jiashenc@gatech.edu",
+    description="A small example package",
+    long_description=long_description,
+    long_description_content_type="text/markdown",
+    url="https://github.com/jiashenC/langcache",
+    packages=setuptools.find_packages(),
+    classifiers=[
+        "Programming Language :: Python :: 3",
+        "Development Status :: 1 - Planning"
+    ],
+    python_requires='>=3.6',
+    install_requires=load_requirements(),
+)
diff --git a/test/open-ai-integration.ipynb b/test/open-ai-integration.ipynb
new file mode 100644
index 0000000..ee696db
--- /dev/null
+++ b/test/open-ai-integration.ipynb
@@ -0,0 +1,379 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Import dependencies\n",
+    "import os"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# get OpenAI key if needed\n",
+    "\n",
+    "try:\n",
+    "    api_key = os.environ[\"OPENAI_API_KEY\"]\n",
+    "except KeyError:\n",
+    "    api_key = str(input(\"🔑 Enter your OpenAI key: \"))\n",
+    "    os.environ[\"OPENAI_API_KEY\"] = api_key"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  What is GitHub?\n",
+      "GitHub is a web-based platform for version control and collaboration, focusing on code sharing and projects.\n",
+      "Time taken:  1.8351471424102783\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n",
+      "01-25-2024 19:49:43 WARNING[create_index_executor:create_index_executor.py:_create_evadb_index:0119] Index wubhlsyqed already exists. It will be updated on existing table.\n",
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  what are the most important concepts in databases\n",
+      "Relational model, tables, primary keys, foreign keys, normalization, and query language, such as SQL.\n",
+      "Time taken:  3.3530569076538086\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n",
+      "01-25-2024 19:49:45 WARNING[create_index_executor:create_index_executor.py:_create_evadb_index:0119] Index wubhlsyqed already exists. It will be updated on existing table.\n",
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  can you explain what GitHub is\n",
+      "GitHub is a web-based platform where developers can collaborate on and store their code repositories.\n",
+      "Time taken:  2.42620587348938\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  What is GitHub?\n",
+      "GitHub is a web-based platform for version control and collaboration, focusing on code sharing and projects.\n",
+      "Time taken:  0.9597771167755127\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n",
+      "01-25-2024 19:49:49 WARNING[create_index_executor:create_index_executor.py:_create_evadb_index:0119] Index wubhlsyqed already exists. It will be updated on existing table.\n",
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  what is the purpose of GitHub\n",
+      "The purpose of GitHub is to provide a platform for version control and collaboration on software development projects.\n",
+      "Time taken:  2.3775222301483154\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n",
+      "01-25-2024 19:49:51 WARNING[create_index_executor:create_index_executor.py:_create_evadb_index:0119] Index wubhlsyqed already exists. It will be updated on existing table.\n",
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  What's github\n",
+      "GitHub is a web-based platform for version control and collaborative development of software projects.\n",
+      "Time taken:  2.712510824203491\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  What are the important topics to learn in databases?\n",
+      "Relational model, tables, primary keys, foreign keys, normalization, and query language, such as SQL.\n",
+      "Time taken:  1.801367998123169\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n",
+      "01-25-2024 19:49:56 WARNING[create_index_executor:create_index_executor.py:_create_evadb_index:0119] Index wubhlsyqed already exists. It will be updated on existing table.\n",
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  List some topics to learn in databases\n",
+      "- Data modeling \n",
+      "- Relational databases \n",
+      "- SQL \n",
+      "- Query optimization \n",
+      "- Indexing \n",
+      "- Data normalization \n",
+      "- NoSQL databases \n",
+      "- Database administration \n",
+      "- Database security \n",
+      "- Data warehousing\n",
+      "Time taken:  3.0051629543304443\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  Can you tell me what Github is?\n",
+      "GitHub is a web-based platform where developers can collaborate on and store their code repositories.\n",
+      "Time taken:  0.9954211711883545\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n",
+      "01-25-2024 19:50:00 WARNING[create_index_executor:create_index_executor.py:_create_evadb_index:0119] Index wubhlsyqed already exists. It will be updated on existing table.\n",
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  How I can speak English fluently?\n",
+      "Practice speaking regularly with native English speakers and immerse yourself in the language through reading and listening.\n",
+      "Time taken:  2.6009669303894043\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  How can I learn to speak English fluently?\n",
+      "Practice speaking regularly with native English speakers and immerse yourself in the language through reading and listening.\n",
+      "Time taken:  0.9783082008361816\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n",
+      "01-25-2024 19:50:04 WARNING[create_index_executor:create_index_executor.py:_create_evadb_index:0119] Index wubhlsyqed already exists. It will be updated on existing table.\n",
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "QUESTION:  How does 3D printing work?\n",
+      "3D printing works by creating objects layer by layer using melted materials like plastic or metal.\n",
+      "Time taken:  3.003875732421875\n",
+      "\n",
+      "\n",
+      "\n",
+      "QUESTION:  How do 3D printing work?\n",
+      "3D printing works by creating objects layer by layer using melted materials like plastic or metal.\n",
+      "Time taken:  0.9676847457885742\n",
+      "\n",
+      "\n",
+      "\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "/Users/swetavooda/workspace/langCache/langcache/langcache-venv/lib/python3.11/site-packages/sentence_transformers/SentenceTransformer.py:157: FutureWarning: Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
+      "  sentences_sorted = [sentences[idx] for idx in length_sorted_idx]\n"
+     ]
+    }
+   ],
+   "source": [
+    "import time\n",
+    "from langcache.adapter.openai import OpenAI\n",
+    "from langcache.core import Cache\n",
+    "\n",
+    "cache = Cache(tune_frequency=5, tune_policy=\"recall\")\n",
+    "client = OpenAI(cache)\n",
+    "\n",
+    "# Several questions rephrase an earlier one so that their timings can be compared.\n",
+    "questions = [\"What is GitHub?\",\n",
+    "             \"what are the most important concepts in databases\",\n",
+    "             \"can you explain what GitHub is\", \"What is GitHub?\",\n",
+    "             \"what is the purpose of GitHub\", \"What's github\",\n",
+    "             \"What are the important topics to learn in databases?\",\n",
+    "             \"List some topics to learn in databases\",\n",
+    "             \"Can you tell me what Github is?\",\n",
+    "             \"How I can speak English fluently?\",\n",
+    "             \"How can I learn to speak English fluently?\",\n",
+    "             \"How does 3D printing work?\", \"How do 3D printing work?\"]\n",
+    "results = []\n",
+    "for question in questions:\n",
+    "    # perf_counter() is the clock meant for measuring durations; time() can jump if the system clock is adjusted.\n",
+    "    start_time = time.perf_counter()\n",
+    "    completion = client.chat.completions.create(\n",
+    "        model=\"gpt-3.5-turbo\",\n",
+    "        messages=[\n",
+    "            {\"role\": \"system\", \"content\": \"You are an helpful assistant to answer all my questions within 15 words limit\"},\n",
+    "            {\"role\": \"user\", \"content\": question},\n",
+    "        ],\n",
+    "    )\n",
+    "    elapsed = time.perf_counter() - start_time\n",
+    "    print(\"QUESTION: \", question)\n",
+    "    print(completion)\n",
+    "    print(\"Time taken: \", elapsed)\n",
+    "    print(\"\\n\\n\")\n",
+    "    results.append(completion)\n"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "langcache-venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.7"
+  },
+  "orig_nbformat": 4
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}