Spaces:

lizhen30
/

LangChainGo

Runtime error

App Files Community

远兮 committed on Jun 2, 2023

Commit

3de6db3

1 Parent(s): 56ac16d

add redis

Browse files

Files changed (8) hide show

app.py +3 -1
data/llm_test.csv +3 -1
index_bilibili.ipynb +19 -13
llms_asyncio.py +5 -3
openai_chat_prompt_template.py +5 -3
redis/test_common.ipynb +123 -0
redis/test_string.ipynb +111 -0
test_csv/test_pandas.ipynb +62 -20

app.py CHANGED Viewed

@@ -2,10 +2,12 @@ import gradio as gr
 from langchain.llms import OpenAI
 from langchain.llms import PromptLayerOpenAI
 def chatOpenAI(input):
     llm = OpenAI(temperature=0.9)
     return llm(input)
 def promptLayer(input):
     llm = PromptLayerOpenAI(pl_tags=["LangChainGo"])
     return llm(input)
@@ -14,4 +16,4 @@ def promptLayer(input):
 with gr.Blocks() as demo:
     gr.Markdown("# LangChain Test，LLM跑步上车。")
     gr.Interface(fn=promptLayer, inputs="text", outputs="text")
-demo.launch()

 from langchain.llms import OpenAI
 from langchain.llms import PromptLayerOpenAI
 def chatOpenAI(input):
     llm = OpenAI(temperature=0.9)
     return llm(input)
 def promptLayer(input):
     llm = PromptLayerOpenAI(pl_tags=["LangChainGo"])
     return llm(input)
 with gr.Blocks() as demo:
     gr.Markdown("# LangChain Test，LLM跑步上车。")
     gr.Interface(fn=promptLayer, inputs="text", outputs="text")
+demo.launch()

data/llm_test.csv CHANGED Viewed

@@ -1,6 +1,8 @@
 name,age,city,mark
-张三,100,河北,kk
 赵四,19,河北,kk
 赵五,100,河北,kk
 赵六,19,河北,kk
 王五,19,河北,kk

 name,age,city,mark
+张三,212,河北,kk
 赵四,19,河北,kk
 赵五,100,河北,kk
 赵六,19,河北,kk
 王五,19,河北,kk
+,name,age,city,mark
+0,张三,2345,河北,kk

index_bilibili.ipynb CHANGED Viewed

@@ -2,7 +2,7 @@
  "cells": [
   {
    "cell_type": "code",
-   "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -11,7 +11,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 15,
    "metadata": {},
    "outputs": [],
    "source": [
@@ -20,29 +20,35 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 16,
    "metadata": {},
    "outputs": [],
    "source": [
     "loader = BiliBiliLoader(\n",
-    "    [\"https://www.bilibili.com/video/BV1xt411o7Xu/\"]\n",
     ")"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 17,
    "metadata": {},
    "outputs": [
     {
-     "data": {
-      "text/plain": [
-       "[Document(page_content='\\n                Video Title: 【B站黑科技】如何给视频最快速加上字幕（CC字幕/外挂字幕功能介绍、教程，快速做字幕制作）,\\n                description: 目前手机端最新版已经支持该功能了，\\n有一些讲得不好的地方请指正，包涵一下吧~\\n如果有帮到你可以帮我的视频点一下推荐嘛~感谢观看~\\n\\n                Transcript: 哈喽大家好，我是莫多 字幕是让很多up主头疼的问题 有字幕的视频可以增加许多观感体验 但是如果逐字逐句打字幕 会消耗大量的精力 今天在无意之中看到了B站推出的新功能 外挂/CC(closed caption)字幕功能 这个功能可以说是非常贴心了 因为所有人都可以根据自己喜好 随意拖动字幕 包括字体、大小，亦或是关闭字幕 因为在帮助界面里面没有找到具体的使用说明 我简单琢磨了一下 把我使用的心得分享一下吧 我们经常可以看到 会有野生的字幕君帮忙打字幕 但是以弹幕做字幕的话难免会有对不准的问题存在 我先给大家演示一下最简单制作字幕的方法 因为现在暂时没有办法 给别人的视频添加字幕 然后我就以我的视频为例吧 在字幕功能里面选择添加字幕 弹出的窗口里面 选择编辑 我们可以在播放的时候一边播放 一边插入字幕 这里可以看到 这里有个按钮是 我们可以以文档的方式上传字幕 目前常见支持的字幕格式貌似只有ASS 而其他常见字幕格式 如SRT，SSA，SUP还不能够支持 那么要怎样才能既快速又高效制作字幕呢? 这里我向各个UP主推荐一个非常好用的软件 它的名字叫做 （现在是收费软件）\\n人人译视界 （现在是收费软件）\\n因为它可以将我们 （现在是收费软件）\\n上传视频做成字幕 （现在是收费软件）\\n而且每段字幕都卡好时间点 （现在是收费软件）\\n大大减小了打字幕的时间 （现在是收费软件）\\n而且目前这是一款免费软件 （现在是收费软件）\\n不过就算以后收费了我也会非常乐意使用它 因为它集齐了听译和做字幕两个功能 对视频创作者来说有了这款软件 简直是如虎添翼呀 现在我给大家简单做个例子 我先把视频 当然音频也可以 拖到这款软件里面 然后点击AI听译 点击中译英  然后再点击（仅上传音频 ） 当然日语什么的也可以 但是最好是你已经做好了视频里面 不带背景音乐（BGM）的 这样它识别会更容易 然后选择只上传音频文件 然后选择AI听译 然后过一段时间他就会 开始上传 再过一段时间的话他就会 提示你转换完成 如果说有个别错别字话可以自己调整一下 （像我闽南口音比较重的话就要改很多字233） 然后这边分栏有许多功能 主要使用的是拆分和合并 拆分字幕和合并字幕 主要是合并为单行 （还有删除操作，选中字幕→Delete键） 如果你上传的 是中文视频的话AI听译里面 选择中译英 后面就是全选所有字幕（Ctrl+A） 点击清除译文就好了 （可以通过窗口左上角视频播放调整字幕） 调整好后导出字幕 选择ASS格式 当然我现在没有仔细做(主要是做个例子） ASS格式 这里就先导入到桌面上吧 （注意，这里选项→文本编码→选择UTF~16LE） （否则上传可能显示时间不合法） 因为会有一点点兼容的问题 我们还需要用记事本打开这个文档 然后将里面的这个部分 用替换功能把它替换掉 编辑→替换 将这个替换为空→全部替换 这里表示的应该是一个回车符的意思 但是播放器是不会显示出来的 B站上的外挂字幕功能的话就会显示 所以需要去掉 以后如果这个功能改进的话我也会在字幕里备注的 这时候（保存一下）便可以上传到B站上了 浏览一下如果没什么问题的话便可以提交了 或者是保存草稿 最后简单总结一下 内嵌和外挂字幕的优缺点吧 内嵌字幕的优点是样式多 但不能按照观众的每个人喜好去设置 外挂字幕的优点是 可以自由开启或关闭字幕 也可以���据每个人 自己的喜好来选择 特别是对一些生肉视频 有特殊需求者可以下载不带字幕的原视频 同时也不影响其他人观看体验 （还可以不带字幕截图） 对于B站推出的这个新功能我是非常支持的 好的 本次的视频就到这里了 有的内容讲得不太好 希望大家多多包涵 喜欢的朋友可以点个推荐吧 谢谢观看(❁´ω`❁)\\n                ', metadata={'bvid': 'BV1xt411o7Xu', 'aid': 34218168, 'videos': 1, 'tid': 122, 'tname': '野生技能协会', 'copyright': 1, 'pic': 
'http://i0.hdslb.com/bfs/archive/c6d6d31048b587b00e9b87b586cc083ddfaa2106.jpg', 'title': '【B站黑科技】如何给视频最快速加上字幕（CC字幕/外挂字幕功能介绍、教程，快速做字幕制作）', 'pubdate': 1540029603, 'ctime': 1540019978, 'desc': '目前手机端最新版已经支持该功能了，\\n有一些讲得不好的地方请指正，包涵一下吧~\\n如果有帮到你可以帮我的视频点一下推荐嘛~感谢观看~', 'desc_v2': [{'raw_text': '目前手机端最新版已经支持该功能了，\\n有一些讲得不好的地方请指正，包涵一下吧~\\n如果有帮到你可以帮我的视频点一下推荐嘛~感谢观看~', 'type': 1, 'biz_id': 0}], 'state': 0, 'duration': 408, 'rights': {'bp': 0, 'elec': 0, 'download': 1, 'movie': 0, 'pay': 0, 'hd5': 0, 'no_reprint': 1, 'autoplay': 1, 'ugc_pay': 0, 'is_cooperation': 0, 'ugc_pay_preview': 0, 'no_background': 0, 'clean_mode': 0, 'is_stein_gate': 0, 'is_360': 0, 'no_share': 0, 'arc_pay': 0, 'free_watch': 0}, 'owner': {'mid': 1865692, 'name': '莫多是攻', 'face': 'http://i1.hdslb.com/bfs/face/83d880d545cc9dcf948a7ce4204477aadf275cd7.jpg'}, 'stat': {'aid': 34218168, 'view': 125606, 'danmaku': 170, 'reply': 327, 'favorite': 3701, 'coin': 1017, 'share': 494, 'now_rank': 0, 'his_rank': 0, 'like': 2631, 'dislike': 0, 'evaluation': '', 'argue_msg': ''}, 'dynamic': '#经验分享##视频教程##教学视频#', 'cid': 59939848, 'dimension': {'width': 1920, 'height': 1080, 'rotate': 0}, 'premiere': None, 'teenage_mode': 0, 'is_chargeable_season': False, 'is_story': False, 'no_cache': False, 'pages': [{'cid': 59939848, 'page': 1, 'from': 'vupload', 'part': 'P1', 'duration': 408, 'vid': '', 'weblink': '', 'dimension': {'width': 1920, 'height': 1080, 'rotate': 0}}], 'is_season_display': False, 'user_garb': {'url_image_ani_cut': ''}, 'honor_reply': {}, 'like_icon': '', 'need_jump_bv': False, 'url': 'https://www.bilibili.com/video/BV1xt411o7Xu/'})]"
-      ]
-     },
-     "execution_count": 17,
-     "metadata": {},
-     "output_type": "execute_result"
     }
    ],
    "source": [

  "cells": [
   {
    "cell_type": "code",
+   "execution_count": 5,
    "metadata": {},
    "outputs": [],
    "source": [
   },
   {
    "cell_type": "code",
+   "execution_count": 6,
    "metadata": {},
    "outputs": [],
    "source": [
   },
   {
    "cell_type": "code",
+   "execution_count": 7,
    "metadata": {},
    "outputs": [],
    "source": [
     "loader = BiliBiliLoader(\n",
+    "    [\"https://www.bilibili.com/video/BV1DP411m7TR/\"]\n",
     ")"
    ]
   },
   {
    "cell_type": "code",
+   "execution_count": 8,
    "metadata": {},
    "outputs": [
     {
+     "ename": "RuntimeError",
+     "evalue": "This event loop is already running",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[0;31mRuntimeError\u001b[0m                              Traceback (most recent call last)",
+      "Cell \u001b[0;32mIn[8], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m loader\u001b[39m.\u001b[39;49mload()\n",
+      "File \u001b[0;32m~/anaconda3/lib/python3.10/site-packages/langchain/document_loaders/bilibili.py:23\u001b[0m, in \u001b[0;36mBiliBiliLoader.load\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m     21\u001b[0m results \u001b[39m=\u001b[39m []\n\u001b[1;32m     22\u001b[0m \u001b[39mfor\u001b[39;00m url \u001b[39min\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mvideo_urls:\n\u001b[0;32m---> 23\u001b[0m     transcript, video_info \u001b[39m=\u001b[39m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49m_get_bilibili_subs_and_info(url)\n\u001b[1;32m     24\u001b[0m     doc \u001b[39m=\u001b[39m Document(page_content\u001b[39m=\u001b[39mtranscript, metadata\u001b[39m=\u001b[39mvideo_info)\n\u001b[1;32m     25\u001b[0m     results\u001b[39m.\u001b[39mappend(doc)\n",
+      "File \u001b[0;32m~/anaconda3/lib/python3.10/site-packages/langchain/document_loaders/bilibili.py:51\u001b[0m, in \u001b[0;36mBiliBiliLoader._get_bilibili_subs_and_info\u001b[0;34m(self, url)\u001b[0m\n\u001b[1;32m     48\u001b[0m     \u001b[39melse\u001b[39;00m:\n\u001b[1;32m     49\u001b[0m         \u001b[39mraise\u001b[39;00m \u001b[39mValueError\u001b[39;00m(\u001b[39mf\u001b[39m\u001b[39m\"\u001b[39m\u001b[39m{\u001b[39;00murl\u001b[39m}\u001b[39;00m\u001b[39m is not bilibili url.\u001b[39m\u001b[39m\"\u001b[39m)\n\u001b[0;32m---> 51\u001b[0m video_info \u001b[39m=\u001b[39m sync(v\u001b[39m.\u001b[39;49mget_info())\n\u001b[1;32m     52\u001b[0m video_info\u001b[39m.\u001b[39mupdate({\u001b[39m\"\u001b[39m\u001b[39murl\u001b[39m\u001b[39m\"\u001b[39m: url})\n\u001b[1;32m     54\u001b[0m \u001b[39m# Get subtitle url\u001b[39;00m\n",
+      "File \u001b[0;32m~/anaconda3/lib/python3.10/site-packages/bilibili_api/utils/sync.py:24\u001b[0m, in \u001b[0;36msync\u001b[0;34m(coroutine)\u001b[0m\n\u001b[1;32m     22\u001b[0m __ensure_event_loop()\n\u001b[1;32m     23\u001b[0m loop \u001b[39m=\u001b[39m asyncio\u001b[39m.\u001b[39mget_event_loop()\n\u001b[0;32m---> 24\u001b[0m \u001b[39mreturn\u001b[39;00m loop\u001b[39m.\u001b[39;49mrun_until_complete(coroutine)\n",
+      "File \u001b[0;32m~/anaconda3/lib/python3.10/asyncio/base_events.py:625\u001b[0m, in \u001b[0;36mBaseEventLoop.run_until_complete\u001b[0;34m(self, future)\u001b[0m\n\u001b[1;32m    614\u001b[0m \u001b[39m\u001b[39m\u001b[39m\"\"\"Run until the Future is done.\u001b[39;00m\n\u001b[1;32m    615\u001b[0m \n\u001b[1;32m    616\u001b[0m \u001b[39mIf the argument is a coroutine, it is wrapped in a Task.\u001b[39;00m\n\u001b[0;32m   (...)\u001b[0m\n\u001b[1;32m    622\u001b[0m \u001b[39mReturn the Future's result, or raise its exception.\u001b[39;00m\n\u001b[1;32m    623\u001b[0m \u001b[39m\"\"\"\u001b[39;00m\n\u001b[1;32m    624\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_check_closed()\n\u001b[0;32m--> 625\u001b[0m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49m_check_running()\n\u001b[1;32m    627\u001b[0m new_task \u001b[39m=\u001b[39m \u001b[39mnot\u001b[39;00m futures\u001b[39m.\u001b[39misfuture(future)\n\u001b[1;32m    628\u001b[0m future \u001b[39m=\u001b[39m tasks\u001b[39m.\u001b[39mensure_future(future, loop\u001b[39m=\u001b[39m\u001b[39mself\u001b[39m)\n",
+      "File \u001b[0;32m~/anaconda3/lib/python3.10/asyncio/base_events.py:584\u001b[0m, in \u001b[0;36mBaseEventLoop._check_running\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m    582\u001b[0m \u001b[39mdef\u001b[39;00m \u001b[39m_check_running\u001b[39m(\u001b[39mself\u001b[39m):\n\u001b[1;32m    583\u001b[0m     \u001b[39mif\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39mis_running():\n\u001b[0;32m--> 584\u001b[0m         \u001b[39mraise\u001b[39;00m \u001b[39mRuntimeError\u001b[39;00m(\u001b[39m'\u001b[39m\u001b[39mThis event loop is already running\u001b[39m\u001b[39m'\u001b[39m)\n\u001b[1;32m    585\u001b[0m     \u001b[39mif\u001b[39;00m events\u001b[39m.\u001b[39m_get_running_loop() \u001b[39mis\u001b[39;00m \u001b[39mnot\u001b[39;00m \u001b[39mNone\u001b[39;00m:\n\u001b[1;32m    586\u001b[0m         \u001b[39mraise\u001b[39;00m \u001b[39mRuntimeError\u001b[39;00m(\n\u001b[1;32m    587\u001b[0m             \u001b[39m'\u001b[39m\u001b[39mCannot run the event loop while another loop is running\u001b[39m\u001b[39m'\u001b[39m)\n",
+      "\u001b[0;31mRuntimeError\u001b[0m: This event loop is already running"
+     ]
     }
    ],
    "source": [

llms_asyncio.py CHANGED Viewed

@@ -3,6 +3,7 @@ import asyncio
 from langchain.llms import OpenAI
 def generate_serially():
     llm = OpenAI(temperature=0.9)
     for _ in range(10):
@@ -23,11 +24,12 @@ async def generate_concurrently():
 s = time.perf_counter()
 # If running this outside of Jupyter, use asyncio.run(generate_concurrently())
-generate_concurrently()
 elapsed = time.perf_counter() - s
-print('\033[1m' + f"Concurrent executed in {elapsed:0.2f} seconds." + '\033[0m')
 s = time.perf_counter()
 generate_serially()
 elapsed = time.perf_counter() - s
-print('\033[1m' + f"Serial executed in {elapsed:0.2f} seconds." + '\033[0m')

 from langchain.llms import OpenAI
 def generate_serially():
     llm = OpenAI(temperature=0.9)
     for _ in range(10):
 s = time.perf_counter()
 # If running this outside of Jupyter, use asyncio.run(generate_concurrently())
+generate_concurrently()
 elapsed = time.perf_counter() - s
+print('\033[1m' +
+      f"Concurrent executed in {elapsed:0.2f} seconds." + '\033[0m')
 s = time.perf_counter()
 generate_serially()
 elapsed = time.perf_counter() - s
+print('\033[1m' + f"Serial executed in {elapsed:0.2f} seconds." + '\033[0m')

openai_chat_prompt_template.py CHANGED Viewed

@@ -15,11 +15,13 @@ human_template = "{text}"
 human_message_prompt = HumanMessagePromptTemplate.from_template(human_template)
 # 这里是使用chat请求，返回BaseMessage。
-chat_prompt = ChatPromptTemplate.from_messages([system_message_prompt, human_message_prompt])
-result = chat(chat_prompt.format_prompt(input_language="中文", output_language="英语", text="我想请假").to_messages())
 print(result.content)
 # 这里是使用chain请求，返回str, 带有聊天模型的chain。
 chain = LLMChain(llm=chat, prompt=chat_prompt)
 result = chain.run(input_language="中文", output_language="英语", text="我想请假")
-print(result)

 human_message_prompt = HumanMessagePromptTemplate.from_template(human_template)
 # 这里是使用chat请求，返回BaseMessage。
+chat_prompt = ChatPromptTemplate.from_messages(
+    [system_message_prompt, human_message_prompt])
+result = chat(chat_prompt.format_prompt(input_language="中文",
+              output_language="英语", text="我想请假").to_messages())
 print(result.content)
 # 这里是使用chain请求，返回str, 带有聊天模型的chain。
 chain = LLMChain(llm=chat, prompt=chat_prompt)
 result = chain.run(input_language="中文", output_language="英语", text="我想请假")
+print(result)

redis/test_common.ipynb ADDED Viewed

	@@ -0,0 +1,123 @@

+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 13,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import redis\n",
+    "\n",
+    "conn_pool = redis.ConnectionPool(host='10.254.13.87', port='6379', max_connections=10)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "[b'user', b'test_hello', b'www.biancheng.net', b'test_list', b'test_hash', b'test_set', b'fans:num', b'user:id:01:username']\n"
+     ]
+    }
+   ],
+   "source": [
+    "r = redis.Redis(connection_pool=conn_pool)\n",
+    "key_list = r.keys('*')\n",
+    "print(key_list)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "user b'hash'\n",
+      "test_hello b'string'\n",
+      "www.biancheng.net b'string'\n",
+      "test_list b'list'\n",
+      "test_hash b'hash'\n",
+      "test_set b'set'\n",
+      "fans:num b'string'\n",
+      "user:id:01:username b'string'\n"
+     ]
+    }
+   ],
+   "source": [
+    "for key in key_list:\n",
+    "    keyStr = key.decode()\n",
+    "    print(keyStr, r.type(keyStr))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 19,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "b'hash'\n",
+      "1\n",
+      "0\n"
+     ]
+    }
+   ],
+   "source": [
+    "print(r.type('user'))\n",
+    "print(r.exists('test_hello'))\n",
+    "print(r.exists('user1'))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 24,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "0\n",
+      "0\n"
+     ]
+    }
+   ],
+   "source": [
+    "delete_result = r.delete('test_hello', 'test_hell2')\n",
+    "print(delete_result)\n",
+    "print(r.exists('test_hello'))"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "base",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.10"
+  },
+  "orig_nbformat": 4
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}

redis/test_string.ipynb ADDED Viewed

	@@ -0,0 +1,111 @@

+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import redis\n",
+    "\n",
+    "r = redis.Redis(host='10.254.13.87', port='6379', db=0)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "b'math'\n"
+     ]
+    }
+   ],
+   "source": [
+    "r.set('subject', 'math')\n",
+    "print(r.get('subject'))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "[b'lizhen', b'123']\n",
+      "6\n"
+     ]
+    }
+   ],
+   "source": [
+    "r.mset({'username': 'lizhen', 'password': '123'})\n",
+    "print(r.mget('username', 'password'))\n",
+    "print(r.strlen('username'))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "b'18'\n",
+      "b'20'\n",
+      "b'17'\n",
+      "b'18'\n",
+      "b'17'\n",
+      "19.19999999999999929\n",
+      "9.19999999999999929\n"
+     ]
+    }
+   ],
+   "source": [
+    "r.set('age','18')\n",
+    "print(r.get('age'))\n",
+    "r.incrby('age', 2)\n",
+    "print(r.get('age'))\n",
+    "r.decrby('age', 3)\n",
+    "print(r.get('age'))\n",
+    "r.incr('age')\n",
+    "print(r.get('age'))\n",
+    "r.decr('age')\n",
+    "print(r.get('age'))\n",
+    "r.incrbyfloat('age', 2.2)\n",
+    "print(r.get('age').decode())\n",
+    "r.incrbyfloat('age', -10)\n",
+    "print(r.get('age').decode())"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "base",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.10.10"
+  },
+  "orig_nbformat": 4
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}

test_csv/test_pandas.ipynb CHANGED Viewed

@@ -2,55 +2,97 @@
  "cells": [
   {
    "cell_type": "code",
-   "execution_count": 4,
    "metadata": {},
    "outputs": [],
    "source": [
-    "from langchain.document_loaders.csv_loader import CSVLoader\n",
-    "from langchain.docstore.document import Document"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
    "metadata": {},
    "outputs": [],
    "source": [
-    "loader = CSVLoader(file_path='data/llm_test.csv')\n",
     "\n",
-    "csv = loader.load()"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": 6,
    "metadata": {},
    "outputs": [
     {
-     "ename": "TypeError",
-     "evalue": "__init__() takes exactly 1 positional argument (3 given)",
-     "output_type": "error",
-     "traceback": [
-      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
-      "\u001b[0;31mTypeError\u001b[0m                                 Traceback (most recent call last)",
-      "Cell \u001b[0;32mIn[6], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m new_document \u001b[39m=\u001b[39m Document(\u001b[39m\"\u001b[39;49m\u001b[39mllm test by lizhen\u001b[39;49m\u001b[39m\"\u001b[39;49m, {\u001b[39m\"\u001b[39;49m\u001b[39ma\u001b[39;49m\u001b[39m\"\u001b[39;49m: \u001b[39m\"\u001b[39;49m\u001b[39m1\u001b[39;49m\u001b[39m\"\u001b[39;49m, \u001b[39m\"\u001b[39;49m\u001b[39mb\u001b[39;49m\u001b[39m\"\u001b[39;49m: \u001b[39m\"\u001b[39;49m\u001b[39m2\u001b[39;49m\u001b[39m\"\u001b[39;49m, \u001b[39m\"\u001b[39;49m\u001b[39mc\u001b[39;49m\u001b[39m\"\u001b[39;49m: \u001b[39m\"\u001b[39;49m\u001b[39m3\u001b[39;49m\u001b[39m\"\u001b[39;49m})\n\u001b[1;32m      2\u001b[0m csv\u001b[39m.\u001b[39minsert(new_document)\n",
-      "File \u001b[0;32m~/anaconda3/lib/python3.10/site-packages/pydantic/main.py:332\u001b[0m, in \u001b[0;36mpydantic.main.BaseModel.__init__\u001b[0;34m()\u001b[0m\n",
-      "\u001b[0;31mTypeError\u001b[0m: __init__() takes exactly 1 positional argument (3 given)"
      ]
     }
    ],
    "source": [
-    "new_document = Document(page_content='\\ufeff日期: 20230312\\nsn: 703052302050002380\\n是否内测用户: 0\\nquery_sentence: 帮我批改这些练习题\\ndomain: 1000726\\ndomain释义: null\\ndomain_support: 1\\nresult_support: 1\\nintent_support: 1\\nquery_intent: 1\\n: ' metadata={'source': 'data/xbxb.csv', 'row': 0})\n",
-    "csv.insert(new_document)"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
    "metadata": {},
-   "outputs": [],
    "source": [
-    "print(data)"
    ]
   }
  ],

  "cells": [
   {
    "cell_type": "code",
+   "execution_count": 1,
    "metadata": {},
    "outputs": [],
    "source": [
+    "import pandas as pd"
    ]
   },
   {
    "cell_type": "code",
+   "execution_count": 7,
    "metadata": {},
    "outputs": [],
    "source": [
+    "# 定义要写入的数据\n",
+    "data = [\n",
+    "    ['王五', '19', '河北', 'kk']\n",
+    "]\n",
+    "\n",
+    "# 创建DataFrame对象\n",
+    "df = pd.DataFrame(data, columns=['name', 'age', 'city', 'mark'])\n",
     "\n",
+    "# 将DataFrame写入CSV文件\n",
+    "df.to_csv('../data/llm_test.csv', index=False, mode='a', header=False)\n"
    ]
   },
   {
    "cell_type": "code",
    "execution_count": 6,
    "metadata": {},
+   "outputs": [],
+   "source": [
+    "# 读取CSV文件到DataFrame\n",
+    "df = pd.read_csv('../data/llm_test.csv')\n",
+    "# 修改特定行列的数据\n",
+    "row_index = 0  # 要修改的行索引，除去表头，从0开始\n",
+    "column_name = 'age'  # 要修改的列名\n",
+    "new_value = '2345'  # 修改后的值\n",
+    "\n",
+    "df.loc[row_index, column_name] = new_value\n",
+    "# 将修改后的DataFrame写回到CSV文件\n",
+    "df.to_csv('../data/llm_test.csv', index=True)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 20,
+   "metadata": {},
    "outputs": [
     {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "name    2\n",
+      "age     2\n",
+      "city    2\n",
+      "mark    2\n",
+      "dtype: int64\n"
      ]
     }
    ],
    "source": [
+    "# 读取CSV文件到DataFrame\n",
+    "df = pd.read_csv('../data/llm_test.csv')\n",
+    "\n",
+    "# 查找满足特定条件的行数据\n",
+    "condition = df['age'] == 100  # 以Column1列为例，查找值为'Value1'的行\n",
+    "filtered_data = df[condition]\n",
+    "\n",
+    "# 打印查找结果\n",
+    "print(filtered_data)\n"
    ]
   },
   {
    "cell_type": "code",
+   "execution_count": 4,
    "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "  name  age city mark\n",
+      "0   张三  100   河北   kk\n",
+      "1   赵四   19   河北   kk\n",
+      "2   赵五  100   河北   kk\n"
+     ]
+    }
+   ],
    "source": [
+    "df = pd.read_csv('../data/llm_test.csv').head(3)\n",
+    "print(df)"
    ]
   }
  ],