2714.html 36 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693
  1. <!DOCTYPE html>
  2. <html lang="en" data-default-color-scheme=auto>
  3. <head><!-- hexo injector head_begin start -->
  4. <script async src="https://analytics.umami.is/script.js" data-website-id="e59ec28a-c9a7-4104-9e62-a9f7eb3fac0b"></script>
  5. <!-- hexo injector head_begin end -->
  6. <meta charset="UTF-8">
  7. <link rel="apple-touch-icon" sizes="76x76" href="https://img.limour.top/2023/08/29/64ee07361815a.webp">
  8. <link rel="icon" href="https://img.limour.top/2023/08/29/64ee07361815a.webp">
  9. <meta name="viewport" content="width=device-width, initial-scale=1.0, maximum-scale=5.0, shrink-to-fit=no">
  10. <meta http-equiv="x-ua-compatible" content="ie=edge">
  11. <meta name="theme-color" content="#2f4154">
  12. <meta name="author" content="Limour">
  13. <meta name="keywords" content="">
  14. <meta name="description" content="Chroma是一个可以帮助计算机理解文本的工具。它可以让你把文本放到一个“盒子”里,这个“盒子”可以让计算机更容易地找到和理解文本。你可以用它来创建一个文本库,然后通过输入问题,找到和问题相关的文本。比如,你可以创建一个文本库,里面有许多关于历史的文章,然后你可以输入“什么是古代中国的四大发明”,Chroma就可以帮你找到相关的文章。Chroma还有很多其他的功能,可以让你更方便地管理和搜索文本。">
  15. <meta property="og:type" content="article">
  16. <meta property="og:title" content="基于Chroma搭建个人知识库的全文索引">
  17. <meta property="og:url" content="https://occdn.limour.top/2714.html">
  18. <meta property="og:site_name" content="Limour&#39;s Blog">
  19. <meta property="og:description" content="Chroma是一个可以帮助计算机理解文本的工具。它可以让你把文本放到一个“盒子”里,这个“盒子”可以让计算机更容易地找到和理解文本。你可以用它来创建一个文本库,然后通过输入问题,找到和问题相关的文本。比如,你可以创建一个文本库,里面有许多关于历史的文章,然后你可以输入“什么是古代中国的四大发明”,Chroma就可以帮你找到相关的文章。Chroma还有很多其他的功能,可以让你更方便地管理和搜索文本。">
  20. <meta property="og:locale" content="en_US">
  21. <meta property="article:published_time" content="2023-04-26T15:22:57.000Z">
  22. <meta property="article:modified_time" content="2023-09-01T13:28:03.721Z">
  23. <meta property="article:author" content="Limour">
  24. <meta name="twitter:card" content="summary_large_image">
  25. <title>基于Chroma搭建个人知识库的全文索引 - Limour&#39;s Blog</title>
  26. <link rel="stylesheet" href="https://jscdn.limour.top/npm/bootstrap@4.6.1/dist/css/bootstrap.min.css" />
  27. <link rel="stylesheet" href="https://jscdn.limour.top/npm/github-markdown-css@4.0.0/github-markdown.min.css" />
  28. <link rel="stylesheet" href="https://jscdn.limour.top/npm/hint.css@2.7.0/hint.min.css" />
  29. <link rel="stylesheet" href="https://lib.baomitu.com/fancybox/3.5.7/jquery.fancybox.min.css" />
  30. <!-- 主题依赖的图标库,不要自行修改 -->
  31. <!-- Do not modify the link that theme dependent icons -->
  32. <link rel="stylesheet" href="//at.alicdn.com/t/font_1749284_hj8rtnfg7um.css">
  33. <link rel="stylesheet" href="//at.alicdn.com/t/font_1736178_lbnruvf0jn.css">
  34. <link rel="stylesheet" href="/css/main.css" />
  35. <link id="highlight-css" rel="stylesheet" href="/css/highlight.css" />
  36. <link id="highlight-css-dark" rel="stylesheet" href="/css/highlight-dark.css" />
  37. <link rel="stylesheet" href="/theme-inject/custom.css">
  38. <script id="fluid-configs">
  39. var Fluid = window.Fluid || {}; // Bootstrap for the page's inline scripts: reuse an existing global Fluid object, else start from an empty one.
  40. Fluid.ctx = Object.assign({}, Fluid.ctx) // Shallow-copy any existing ctx into a fresh object (an undefined ctx yields {}).
  41. var CONFIG = {"hostname":"occdn.limour.top","root":"/","version":"1.9.5-a","typing":{"enable":true,"typeSpeed":70,"cursorChar":"_","loop":false,"scope":[]},"anchorjs":{"enable":true,"element":"h1,h2,h3,h4,h5,h6","placement":"left","visible":"hover","icon":"§"},"progressbar":{"enable":true,"height_px":3,"color":"#29d","options":{"showSpinner":false,"trickleSpeed":100}},"code_language":{"enable":true,"default":"TEXT"},"copy_btn":true,"image_caption":{"enable":true},"image_zoom":{"enable":true,"img_url_replace":["",""]},"toc":{"enable":true,"placement":"right","headingSelector":"h1,h2,h3,h4,h5,h6","collapseDepth":0},"lazyload":{"enable":true,"loading_img":"https://jscdn.limour.top/gh/Limour-dev/Sakurairo_Vision/load_svg/inload.svg","onlypost":false,"offset_factor":2},"web_analytics":{"enable":false,"follow_dnt":true,"baidu":null,"google":{"measurement_id":null},"tencent":{"sid":null,"cid":null},"woyaola":null,"cnzz":null,"leancloud":{"app_id":null,"app_key":null,"server_url":null,"path":"window.location.pathname","ignore_local":false}},"search_path":"/local-search.xml","include_content_in_search":true}; // Settings object read by the other inline scripts on this page (e.g. CONFIG.toc, CONFIG.anchorjs).
  42. if (CONFIG.web_analytics.follow_dnt) { // Only inspect the Do-Not-Track preference when follow_dnt is set.
  43. var dntVal = navigator.doNotTrack || window.doNotTrack || navigator.msDoNotTrack; // First truthy value among the three DNT properties.
  44. Fluid.ctx.dnt = dntVal && (dntVal.startsWith('1') || dntVal.startsWith('yes') || dntVal.startsWith('on')); // true when the value starts with '1', 'yes' or 'on'; otherwise falsy (false, or the empty dntVal itself). NOTE(review): assumes dntVal is a string when truthy.
  45. }
  46. </script>
  47. <script src="/js/utils.js" ></script>
  48. <script src="/js/color-schema.js" ></script>
  49. <meta name="generator" content="Hexo 6.3.0"></head>
  50. <body>
  51. <header>
  52. <div class="header-inner" style="height: 70vh;">
  53. <nav id="navbar" class="navbar fixed-top navbar-expand-lg navbar-dark scrolling-navbar">
  54. <div class="container">
  55. <a class="navbar-brand" href="/">
  56. <strong>Limour&#39;s Blog</strong>
  57. </a>
  58. <button id="navbar-toggler-btn" class="navbar-toggler" type="button" data-toggle="collapse"
  59. data-target="#navbarSupportedContent"
  60. aria-controls="navbarSupportedContent" aria-expanded="false" aria-label="Toggle navigation">
  61. <div class="animated-icon"><span></span><span></span><span></span></div>
  62. </button>
  63. <!-- Collapsible content -->
  64. <div class="collapse navbar-collapse" id="navbarSupportedContent">
  65. <ul class="navbar-nav ml-auto text-center">
  66. <li class="nav-item">
  67. <a class="nav-link" href="/">
  68. <i class="iconfont icon-home-fill"></i>
  69. <span>Home</span>
  70. </a>
  71. </li>
  72. <li class="nav-item">
  73. <a class="nav-link" href="/archives/">
  74. <i class="iconfont icon-archive-fill"></i>
  75. <span>Archives</span>
  76. </a>
  77. </li>
  78. <li class="nav-item" id="search-btn">
  79. <a class="nav-link" target="_self" href="javascript:;" data-toggle="modal" data-target="#modalSearch" aria-label="Search">
  80. <i class="iconfont icon-search"></i>
  81. </a>
  82. </li>
  83. <li class="nav-item" id="color-toggle-btn">
  84. <a class="nav-link" target="_self" href="javascript:;" aria-label="Color Toggle">
  85. <i class="iconfont icon-dark" id="color-toggle-icon"></i>
  86. </a>
  87. </li>
  88. </ul>
  89. </div>
  90. </div>
  91. </nav>
  92. <div id="banner" class="banner" parallax=true
  93. style="background: url('https://img.limour.top/2023/08/29/64ee08e108638.webp') no-repeat center center; background-size: cover;">
  94. <div class="full-bg-img">
  95. <div class="mask flex-center" style="background-color: rgba(0, 0, 0, 0.3)">
  96. <div class="banner-text text-center fade-in-up">
  97. <div class="h2">
  98. <span id="subtitle" data-typed-text="基于Chroma搭建个人知识库的全文索引"></span>
  99. </div>
  100. <div class="mt-3">
  101. <span class="post-meta">
  102. <i class="iconfont icon-date-fill" aria-hidden="true"></i>
  103. <time datetime="2023-04-26 23:22" pubdate>
  104. April 26, 2023 pm
  105. </time>
  106. </span>
  107. </div>
  108. <div class="mt-1">
  109. <span class="post-meta mr-2">
  110. <i class="iconfont icon-chart"></i>
  111. 4.7k words
  112. </span>
  113. <span class="post-meta mr-2">
  114. <i class="iconfont icon-clock-fill"></i>
  115. 40 mins
  116. </span>
  117. </div>
  118. </div>
  119. </div>
  120. </div>
  121. </div>
  122. </div>
  123. </header>
  124. <main>
  125. <div class="container-fluid nopadding-x">
  126. <div class="row nomargin-x">
  127. <div class="side-col d-none d-lg-block col-lg-2">
  128. </div>
  129. <div class="col-lg-8 nopadding-x-md">
  130. <div class="container nopadding-x-md" id="board-ctn">
  131. <div id="board">
  132. <article class="post-content mx-auto">
  133. <h1 id="seo-header">基于Chroma搭建个人知识库的全文索引</h1>
  134. <div class="markdown-body">
  135. <p>Chroma是一个可以帮助计算机理解文本的工具。它可以让你把文本放到一个“盒子”里,这个“盒子”可以让计算机更容易地找到和理解文本。你可以用它来创建一个文本库,然后通过输入问题,找到和问题相关的文本。比如,你可以创建一个文本库,里面有许多关于历史的文章,然后你可以输入“什么是古代中国的四大发明”,Chroma就可以帮你找到相关的文章。Chroma还有很多其他的功能,可以让你更方便地管理和搜索文本。它是完全免费和开放的,任何人都可以使用它。</p>
  136. <h2 id="构建Docker镜像"><a href="#构建Docker镜像" class="headerlink" title="构建Docker镜像"></a>构建Docker镜像</h2><figure class="highlight dockerfile"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br></pre></td><td class="code"><pre><code class="hljs Dockerfile"><span class="hljs-keyword">FROM</span> python:<span class="hljs-number">3.10</span><br><span class="hljs-keyword">WORKDIR</span><span class="language-bash"> /chroma</span><br><span class="hljs-keyword">COPY</span><span class="language-bash"> ./chroma/requirements.txt requirements.txt</span><br><span class="hljs-keyword">RUN</span><span class="language-bash"> pip install --no-cache-dir --upgrade -r requirements.txt -i https://pypi.tuna.tsinghua.edu.cn/simple</span><br><span class="hljs-keyword">COPY</span><span class="language-bash"> ./chroma/bin/docker_entrypoint.sh /docker_entrypoint.sh</span><br><span class="hljs-keyword">COPY</span><span class="language-bash"> ./chroma /chroma</span><br><span class="hljs-keyword">CMD</span><span class="language-bash"> [<span class="hljs-string">&quot;/docker_entrypoint.sh&quot;</span>]</span><br></code></pre></td></tr></table></figure>
  137. <ul>
  138. <li>mkdir -p ~&#x2F;app&#x2F;chroma &amp;&amp; cd ~&#x2F;app&#x2F;chroma &amp;&amp; nano Dockerfile &amp;&amp; nano docker-compose.yml</li>
  139. <li>git clone --depth&#x3D;1 <a target="_blank" rel="noopener" href="https://ghproxy.com/https://github.com/chroma-core/chroma.git">https://ghproxy.com/https://github.com/chroma-core/chroma.git</a></li>
  140. <li>sudo docker build -t limour&#x2F;chroma .</li>
  141. <li>cp .&#x2F;chroma&#x2F;bin&#x2F;docker_entrypoint.sh .&#x2F;docker_entrypoint.sh</li>
  142. <li>nano .&#x2F;docker_entrypoint.sh 添加上pip镜像 -i <a target="_blank" rel="noopener" href="https://pypi.tuna.tsinghua.edu.cn/simple">https://pypi.tuna.tsinghua.edu.cn/simple</a></li>
  143. </ul>
  144. <h2 id="部署Docker镜像"><a href="#部署Docker镜像" class="headerlink" title="部署Docker镜像"></a>部署Docker镜像</h2><figure class="highlight yml"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br><span class="line">8</span><br><span class="line">9</span><br><span class="line">10</span><br><span class="line">11</span><br><span class="line">12</span><br><span class="line">13</span><br><span class="line">14</span><br><span class="line">15</span><br><span class="line">16</span><br><span class="line">17</span><br><span class="line">18</span><br><span class="line">19</span><br><span class="line">20</span><br><span class="line">21</span><br><span class="line">22</span><br><span class="line">23</span><br><span class="line">24</span><br><span class="line">25</span><br><span class="line">26</span><br><span class="line">27</span><br><span class="line">28</span><br><span class="line">29</span><br><span class="line">30</span><br><span class="line">31</span><br><span class="line">32</span><br><span class="line">33</span><br><span class="line">34</span><br><span class="line">35</span><br><span class="line">36</span><br><span class="line">37</span><br><span class="line">38</span><br><span class="line">39</span><br><span class="line">40</span><br><span class="line">41</span><br><span class="line">42</span><br><span class="line">43</span><br></pre></td><td class="code"><pre><code class="hljs yml"><span class="hljs-attr">version:</span> <span class="hljs-string">&#x27;3.9&#x27;</span><br><br><span class="hljs-attr">networks:</span><br> <span class="hljs-attr">net:</span><br> <span class="hljs-attr">driver:</span> <span class="hljs-string">bridge</span><br><br><span class="hljs-attr">services:</span><br> <span class="hljs-attr">server:</span><br> <span class="hljs-attr">image:</span> <span 
class="hljs-string">limour/chroma</span><br> <span class="hljs-attr">restart:</span> <span class="hljs-string">always</span><br> <span class="hljs-attr">volumes:</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">./chroma:/chroma</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">./index_data:/index_data</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">./docker_entrypoint.sh:/docker_entrypoint.sh</span><br> <span class="hljs-attr">command:</span> <span class="hljs-string">uvicorn</span> <span class="hljs-string">chromadb.app:app</span> <span class="hljs-string">--reload</span> <span class="hljs-string">--workers</span> <span class="hljs-number">1</span> <span class="hljs-string">--host</span> <span class="hljs-number">0.0</span><span class="hljs-number">.0</span><span class="hljs-number">.0</span> <span class="hljs-string">--port</span> <span class="hljs-number">8000</span> <span class="hljs-string">--log-config</span> <span class="hljs-string">log_config.yml</span><br> <span class="hljs-attr">environment:</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">CHROMA_DB_IMPL=clickhouse</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">CLICKHOUSE_HOST=clickhouse</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">CLICKHOUSE_PORT=8123</span><br> <span class="hljs-attr">ports:</span><br> <span class="hljs-bullet">-</span> <span class="hljs-number">5800</span><span class="hljs-string">:8000</span><br> <span class="hljs-attr">depends_on:</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">clickhouse</span><br> <span class="hljs-attr">networks:</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">net</span><br><br> <span class="hljs-attr">clickhouse:</span><br> <span class="hljs-attr">image:</span> <span class="hljs-string">clickhouse/clickhouse-server:22.9-alpine</span><br> <span 
class="hljs-attr">restart:</span> <span class="hljs-string">always</span><br> <span class="hljs-attr">environment:</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">ALLOW_EMPTY_PASSWORD=yes</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">CLICKHOUSE_TCP_PORT=9000</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">CLICKHOUSE_HTTP_PORT=8123</span><br> <span class="hljs-attr">ports:</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">&#x27;8123:8123&#x27;</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">&#x27;9000:9000&#x27;</span><br> <span class="hljs-attr">volumes:</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">./clickhouse_data:/bitnami/clickhouse</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">./backups:/backups</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">./chroma/config/backup_disk.xml:/etc/clickhouse-server/config.d/backup_disk.xml</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">./chroma/config/chroma_users.xml:/etc/clickhouse-server/users.d/chroma.xml</span><br> <span class="hljs-attr">networks:</span><br> <span class="hljs-bullet">-</span> <span class="hljs-string">net</span><br></code></pre></td></tr></table></figure>
  145. <ul>
  146. <li>nano docker-compose.yml</li>
  147. <li>sudo docker-compose up -d</li>
  148. <li>sudo docker-compose logs</li>
  149. </ul>
  150. <h2 id="安装客户端"><a href="#安装客户端" class="headerlink" title="安装客户端"></a>安装客户端</h2><ul>
  151. <li>conda create -n chroma -c conda-forge python&#x3D;3.10 -y</li>
  152. <li>conda activate chroma</li>
  153. <li>pip install chromadb -i <a target="_blank" rel="noopener" href="https://pypi.tuna.tsinghua.edu.cn/simple">https://pypi.tuna.tsinghua.edu.cn/simple</a></li>
  154. <li>conda install -c conda-forge ipykernel -y</li>
  155. <li>python -m ipykernel install --user --name python-chroma</li>
  156. <li>更简单的:# conda create -n chroma -c conda-forge chromadb -y</li>
  157. </ul>
  158. <h2 id="测试用例"><a href="#测试用例" class="headerlink" title="测试用例"></a>测试用例</h2><figure class="highlight python"><table><tr><td class="gutter"><pre><span class="line">1</span><br><span class="line">2</span><br><span class="line">3</span><br><span class="line">4</span><br><span class="line">5</span><br><span class="line">6</span><br><span class="line">7</span><br><span class="line">8</span><br><span class="line">9</span><br><span class="line">10</span><br><span class="line">11</span><br><span class="line">12</span><br><span class="line">13</span><br><span class="line">14</span><br><span class="line">15</span><br><span class="line">16</span><br><span class="line">17</span><br><span class="line">18</span><br><span class="line">19</span><br><span class="line">20</span><br><span class="line">21</span><br><span class="line">22</span><br><span class="line">23</span><br><span class="line">24</span><br><span class="line">25</span><br><span class="line">26</span><br><span class="line">27</span><br><span class="line">28</span><br><span class="line">29</span><br><span class="line">30</span><br><span class="line">31</span><br><span class="line">32</span><br><span class="line">33</span><br><span class="line">34</span><br><span class="line">35</span><br><span class="line">36</span><br><span class="line">37</span><br><span class="line">38</span><br><span class="line">39</span><br><span class="line">40</span><br><span class="line">41</span><br><span class="line">42</span><br><span class="line">43</span><br><span class="line">44</span><br><span class="line">45</span><br><span class="line">46</span><br><span class="line">47</span><br><span class="line">48</span><br><span class="line">49</span><br><span class="line">50</span><br><span class="line">51</span><br><span class="line">52</span><br><span class="line">53</span><br><span class="line">54</span><br></pre></td><td class="code"><pre><code class="hljs python"><span class="hljs-keyword">import</span> chromadb<br><span 
class="hljs-keyword">from</span> chromadb.config <span class="hljs-keyword">import</span> Settings<br> <br>chroma_client = chromadb.Client(Settings(chroma_api_impl=<span class="hljs-string">&quot;rest&quot;</span>,<br> chroma_server_host=<span class="hljs-string">&quot;172.17.0.1&quot;</span>,<br> chroma_server_http_port=<span class="hljs-string">&quot;5800&quot;</span>,<br> chroma_server_ssl_enabled=<span class="hljs-literal">False</span><br> ))<br>collection = chroma_client.get_or_create_collection(name=<span class="hljs-string">&quot;test&quot;</span>)<br> <br>test_documents = [<br> <span class="hljs-string">&quot;长城:中国的标志性建筑之一,是世界上最长的城墙,也是中国古代的军事防御工程,被誉为世界七大奇迹之一。&quot;</span>,<br> <span class="hljs-string">&#x27;故宫:位于北京市中心,是明清两代的皇宫,也是中国最著名的古建筑之一,被誉为“中华民族的瑰宝”。&#x27;</span>,<br> <span class="hljs-string">&quot;大雁塔:位于中国古都西安市,是一座古代佛教文化遗产,建于唐朝,是中国古代建筑艺术的杰出代表。&quot;</span><br>]<br>collection.add(<br> documents = test_documents,<br> metadatas = [&#123;<span class="hljs-string">&quot;chapter&quot;</span>: <span class="hljs-string">&quot;3&quot;</span>, <span class="hljs-string">&quot;verse&quot;</span>: <span class="hljs-string">&quot;16&quot;</span>&#125;, &#123;<span class="hljs-string">&quot;chapter&quot;</span>: <span class="hljs-string">&quot;3&quot;</span>, <span class="hljs-string">&quot;verse&quot;</span>: <span class="hljs-string">&quot;5&quot;</span>&#125;, &#123;<span class="hljs-string">&quot;chapter&quot;</span>: <span class="hljs-string">&quot;29&quot;</span>, <span class="hljs-string">&quot;verse&quot;</span>: <span class="hljs-string">&quot;11&quot;</span>&#125;],<br> ids = [<span class="hljs-string">&quot;id1&quot;</span>, <span class="hljs-string">&quot;id2&quot;</span>, <span class="hljs-string">&quot;id3&quot;</span>]<br>)<br> <br>collection.query(<br> query_texts=[<span class="hljs-string">&quot;长城是哪个朝代修建的?&quot;</span>],<br> n_results=<span class="hljs-number">1</span><br>)<br><span class="hljs-comment"># &#123;&#x27;ids&#x27;: 
[[&#x27;id1&#x27;]],</span><br> <span class="hljs-comment"># &#x27;embeddings&#x27;: None,</span><br> <span class="hljs-comment"># &#x27;documents&#x27;: [[&#x27;长城:中国的标志性建筑之一,是世界上最长的城墙,也是中国古代的军事防御工程,被誉为世界七大奇迹之一。&#x27;]],</span><br> <span class="hljs-comment"># &#x27;metadatas&#x27;: [[&#123;&#x27;chapter&#x27;: &#x27;3&#x27;, &#x27;verse&#x27;: &#x27;16&#x27;&#125;]],</span><br> <span class="hljs-comment"># &#x27;distances&#x27;: [[0.6134731769561768]]&#125;</span><br> <br>collection.query(<br> query_texts=[<span class="hljs-string">&quot;在中国历史上,哪位皇帝曾经居住在位于北京市中心的那座古代宫殿?&quot;</span>],<br> n_results=<span class="hljs-number">1</span><br>)<br><span class="hljs-comment"># &#123;&#x27;ids&#x27;: [[&#x27;id2&#x27;]],</span><br> <span class="hljs-comment"># &#x27;embeddings&#x27;: None,</span><br> <span class="hljs-comment"># &#x27;documents&#x27;: [[&#x27;故宫:位于北京市中心,是明清两代的皇宫,也是中国最著名的古建筑之一,被誉为“中华民族的瑰宝”。&#x27;]],</span><br> <span class="hljs-comment"># &#x27;metadatas&#x27;: [[&#123;&#x27;chapter&#x27;: &#x27;3&#x27;, &#x27;verse&#x27;: &#x27;5&#x27;&#125;]],</span><br> <span class="hljs-comment"># &#x27;distances&#x27;: [[0.4222669303417206]]&#125;</span><br> <br>collection.query(<br> query_texts=[<span class="hljs-string">&quot;营造法式&quot;</span>],<br> n_results=<span class="hljs-number">3</span><br>)<br><span class="hljs-comment"># &#123;&#x27;ids&#x27;: [[&#x27;id2&#x27;, &#x27;id3&#x27;, &#x27;id1&#x27;]],</span><br> <span class="hljs-comment"># &#x27;embeddings&#x27;: None,</span><br> <span class="hljs-comment"># &#x27;documents&#x27;: [[&#x27;故宫:位于北京市中心,是明清两代的皇宫,也是中国最著名的古建筑之一,被誉为“中华民族的瑰宝”。&#x27;,</span><br> <span class="hljs-comment"># &#x27;大雁塔:位于中国古都西安市,是一座古代佛教文化遗产,建于唐朝,是中国古代建筑艺术的杰出代表。&#x27;,</span><br> <span class="hljs-comment"># &#x27;长城:中国的标志性建筑之一,是世界上最长的城墙,也是中国古代的军事防御工程,被誉为世界七大奇迹之一。&#x27;]],</span><br> <span class="hljs-comment"># &#x27;metadatas&#x27;: [[&#123;&#x27;chapter&#x27;: &#x27;3&#x27;, &#x27;verse&#x27;: &#x27;5&#x27;&#125;,</span><br> <span 
class="hljs-comment"># &#123;&#x27;chapter&#x27;: &#x27;29&#x27;, &#x27;verse&#x27;: &#x27;11&#x27;&#125;,</span><br> <span class="hljs-comment"># &#123;&#x27;chapter&#x27;: &#x27;3&#x27;, &#x27;verse&#x27;: &#x27;16&#x27;&#125;]],</span><br> <span class="hljs-comment"># &#x27;distances&#x27;: [[1.073906660079956, 1.2695903778076172, 1.2703778743743896]]&#125;</span><br></code></pre></td></tr></table></figure>
  159. <ul>
  160. <li>sudo docker-compose restart 测试持久化</li>
  161. </ul>
  162. </div>
  163. <hr/>
  164. <div>
  165. <div class="post-metas my-3">
  166. <div class="post-meta mr-3 d-flex align-items-center">
  167. <i class="iconfont icon-category"></i>
  168. <span class="category-chains">
  169. <span class="category-chain">
  170. <a href="/categories/AIGC/" class="category-chain-item">AIGC</a>
  171. </span>
  172. <span class="category-chain">
  173. <a href="/categories/%E5%BC%80%E6%BA%90/" class="category-chain-item">开源</a>
  174. </span>
  175. </span>
  176. </div>
  177. </div>
  178. <div class="license-box my-3">
  179. <div class="license-title">
  180. <div>基于Chroma搭建个人知识库的全文索引</div>
  181. <div>https://occdn.limour.top/2714.html</div>
  182. </div>
  183. <div class="license-meta">
  184. <div class="license-meta-item">
  185. <div>Author</div>
  186. <div>Limour</div>
  187. </div>
  188. <div class="license-meta-item license-meta-date">
  189. <div>Posted on</div>
  190. <div>April 26, 2023</div>
  191. </div>
  192. <div class="license-meta-item">
  193. <div>Licensed under</div>
  194. <div>
  195. <a class="print-no-link" target="_blank" href="https://creativecommons.org/licenses/by-nc-sa/4.0/">
  196. <span class="hint--top hint--rounded" aria-label="BY - Attribution">
  197. <i class="iconfont icon-by"></i>
  198. </span>
  199. </a>
  200. <a class="print-no-link" target="_blank" href="https://creativecommons.org/licenses/by-nc-sa/4.0/">
  201. <span class="hint--top hint--rounded" aria-label="NC - Non-commercial">
  202. <i class="iconfont icon-nc"></i>
  203. </span>
  204. </a>
  205. <a class="print-no-link" target="_blank" href="https://creativecommons.org/licenses/by-nc-sa/4.0/">
  206. <span class="hint--top hint--rounded" aria-label="SA - Share-alike">
  207. <i class="iconfont icon-sa"></i>
  208. </span>
  209. </a>
  210. </div>
  211. </div>
  212. </div>
  213. <div class="license-icon iconfont"></div>
  214. </div>
  215. <div class="post-prevnext my-3">
  216. <article class="post-prev col-6">
  217. <a href="/2718.html" title="【架空】基于反物质本位币的未来货币体系设计">
  218. <i class="iconfont icon-arrowleft"></i>
  219. <span class="hidden-mobile">【架空】基于反物质本位币的未来货币体系设计</span>
  220. <span class="visible-mobile">Previous</span>
  221. </a>
  222. </article>
  223. <article class="post-next col-6">
  224. <a href="/2710.html" title="搭建自己的GPT之vicuna">
  225. <span class="hidden-mobile">搭建自己的GPT之vicuna</span>
  226. <span class="visible-mobile">Next</span>
  227. <i class="iconfont icon-arrowright"></i>
  228. </a>
  229. </article>
  230. </div>
  231. </div>
  232. <article id="comments" lazyload>
  233. <div id="waline"></div>
  234. <script type="text/javascript">
  235. Fluid.utils.loadComments('#waline', function() { // Sets up the Waline comment widget in #waline; loadComments lives in the theme's utils (not shown) and presumably defers this callback until comments should load.
  236. Fluid.utils.createCssLink('https://cdn.staticfile.org/waline/2.15.5/waline.min.css') // Waline stylesheet, version 2.15.5.
  237. Fluid.utils.createScript('https://cdn.staticfile.org/waline/2.15.5/waline.min.js', function() { // Matching Waline script; the callback uses the Waline global, so it presumably runs after the script has loaded.
  238. var options = Object.assign( // Merge site-level settings with page-level overrides; later arguments win on duplicate keys.
  239. {"serverURL":"https://comments.limour.top","path":"window.location.pathname","meta":["nick","mail","link"],"requiredMeta":["nick"],"lang":"zh-CN","emoji":["https://jscdn.limour.top/gh/walinejs/emojis/weibo"],"dark":"html[data-user-color-scheme=\"dark\"]","wordLimit":0,"pageSize":10},
  240. {
  241. el: '#waline',
  242. path: window.location.pathname // Replaces the literal string "window.location.pathname" from the settings above with the real pathname.
  243. }
  244. )
  245. Waline.init(options);
  246. Fluid.utils.waitElementVisible('#waline .vcontent', () => { // Callback for the '#waline .vcontent' element; presumably fired once that element becomes visible.
  247. var imgSelector = '#waline .vcontent img:not(.vemoji)'; // Images inside comment content, excluding those with class vemoji.
  248. Fluid.plugins.imageCaption(imgSelector);
  249. Fluid.plugins.fancyBox(imgSelector);
  250. })
  251. });
  252. });
  253. </script>
  254. <noscript>Please enable JavaScript to view the comments</noscript>
  255. </article>
  256. </article>
  257. </div>
  258. </div>
  259. </div>
  260. <div class="side-col d-none d-lg-block col-lg-2">
  261. <aside class="sidebar" style="margin-left: -1rem">
  262. <div id="toc">
  263. <p class="toc-header">
  264. <i class="iconfont icon-list"></i>
  265. <span>Table of Contents</span>
  266. </p>
  267. <div class="toc-body" id="toc-body"></div>
  268. </div>
  269. </aside>
  270. </div>
  271. </div>
  272. </div>
  273. <a id="scroll-top-button" aria-label="TOP" href="#" role="button">
  274. <i class="iconfont icon-arrowup" aria-hidden="true"></i>
  275. </a>
  276. <div class="modal fade" id="modalSearch" tabindex="-1" role="dialog" aria-labelledby="ModalLabel"
  277. aria-hidden="true">
  278. <div class="modal-dialog modal-dialog-scrollable modal-lg" role="document">
  279. <div class="modal-content">
  280. <div class="modal-header text-center">
  281. <h4 class="modal-title w-100 font-weight-bold">Search</h4>
  282. <button type="button" id="local-search-close" class="close" data-dismiss="modal" aria-label="Close">
  283. <span aria-hidden="true">&times;</span>
  284. </button>
  285. </div>
  286. <div class="modal-body mx-3">
  287. <div class="md-form mb-5">
  288. <input type="text" id="local-search-input" class="form-control validate">
  289. <label data-error="x" data-success="v" for="local-search-input">Keyword</label>
  290. </div>
  291. <div class="list-group" id="local-search-result"></div>
  292. </div>
  293. </div>
  294. </div>
  295. </div>
  296. </main>
  297. <footer>
  298. <div class="footer-inner">
  299. <div class="footer-content">
  300. <a target="_blank" rel="nofollow noopener" href="http://www.beian.gov.cn/portal/registerSystemInfo?recordcode=43130202000203"><img src="https://img.limour.top/2023/08/27/64eadeb81d6a0.webp" srcset="https://jscdn.limour.top/gh/Limour-dev/Sakurairo_Vision/load_svg/inload.svg" lazyload>湘公网安备 43130202000203号 </a> <a target="_blank" rel="nofollow noopener" href="https://beian.miit.gov.cn/">湘ICP备20008299号 </a> <a target="_blank" rel="nofollow noopener" href="https://icp.gov.moe/?keyword=20210128">萌ICP备20210128号</a> <br> <a href="https://www.foreverblog.cn/" target="_blank"> <img src="https://img.foreverblog.cn/logo_en_default.png" srcset="https://jscdn.limour.top/gh/Limour-dev/Sakurairo_Vision/load_svg/inload.svg" lazyload alt="" style="width:auto;height:24px"> </a> <br> <a href="https://hexo.io" target="_blank" rel="nofollow noopener"><span>Hexo</span></a> <i class="iconfont icon-love"></i> <a href="https://github.com/fluid-dev/hexo-theme-fluid" target="_blank" rel="nofollow noopener"><span>Fluid</span></a> <i class="iconfont icon-love"></i> <a href="https://github.com/limour-blog/archives-occdn" target="_blank" rel="nofollow noopener"><span>SRC</span></a>
  301. </div>
  302. </div>
  303. </footer>
  304. <!-- Scripts -->
  305. <script src="https://jscdn.limour.top/npm/nprogress@0.2.0/nprogress.min.js" ></script>
  306. <link rel="stylesheet" href="https://jscdn.limour.top/npm/nprogress@0.2.0/nprogress.min.css" />
  307. <script>
  308. NProgress.configure({"showSpinner":false,"trickleSpeed":100}) // Page-load progress bar: same option values as CONFIG.progressbar.options in the head script.
  309. NProgress.start() // Start the bar immediately while the rest of the page loads.
  310. window.addEventListener('load', function() { // Finish the bar when the window 'load' event fires.
  311. NProgress.done();
  312. })
  313. </script>
  314. <script src="https://jscdn.limour.top/npm/jquery@3.6.4/dist/jquery.min.js" ></script>
  315. <script src="https://jscdn.limour.top/npm/bootstrap@4.6.1/dist/js/bootstrap.min.js" ></script>
  316. <script src="/js/events.js" ></script>
  317. <script src="/js/plugins.js" ></script>
  318. <script src="https://lib.baomitu.com/typed.js/2.0.12/typed.min.js" ></script>
  319. <script>
  320. (function (window, document) { // IIFE: passes the banner subtitle text to the theme's typing plugin without leaking locals into the global scope.
  321. var typing = Fluid.plugins.typing;
  322. var subtitle = document.getElementById('subtitle');
  323. if (!subtitle || !typing) { // Nothing to do when the #subtitle element or the typing plugin is missing.
  324. return;
  325. }
  326. var text = subtitle.getAttribute('data-typed-text'); // The text is carried in the element's data-typed-text attribute.
  327. typing(text);
  328. })(window, document);
  329. </script>
  330. <script src="/js/img-lazyload.js" ></script>
  331. <script>
  332. Fluid.utils.createScript('https://jscdn.limour.top/npm/tocbot@4.20.1/dist/tocbot.min.js', function() { // Builds the sidebar table of contents with tocbot 4.20.1; the callback presumably runs after the script has loaded.
  333. var toc = jQuery('#toc');
  334. if (toc.length === 0 || !window.tocbot) { return; } // Skip when the page has no #toc container or tocbot is unavailable.
  335. var boardCtn = jQuery('#board-ctn');
  336. var boardTop = boardCtn.offset().top; // Top offset of #board-ctn, negated below for headingsOffset.
  337. window.tocbot.init(Object.assign({ // Defaults below; CONFIG.toc is merged last, so its keys win on any overlap.
  338. tocSelector : '#toc-body',
  339. contentSelector : '.markdown-body',
  340. linkClass : 'tocbot-link',
  341. activeLinkClass : 'tocbot-active-link',
  342. listClass : 'tocbot-list',
  343. isCollapsedClass: 'tocbot-is-collapsed',
  344. collapsibleClass: 'tocbot-is-collapsible',
  345. scrollSmooth : true,
  346. includeTitleTags: true,
  347. headingsOffset : -boardTop,
  348. }, CONFIG.toc));
  349. if (toc.find('.toc-list-item').length > 0) { // Make #toc visible only when at least one .toc-list-item was generated.
  350. toc.css('visibility', 'visible');
  351. }
  352. Fluid.events.registerRefreshCallback(function() { // Refresh hook: rebuild the TOC and repeat the visibility check (when it fires is decided by the theme's events module, not shown).
  353. if ('tocbot' in window) {
  354. tocbot.refresh();
  355. var toc = jQuery('#toc');
  356. if (toc.length === 0 || !tocbot) { // NOTE(review): the !tocbot test comes after tocbot.refresh() has already been called above.
  357. return;
  358. }
  359. if (toc.find('.toc-list-item').length > 0) {
  360. toc.css('visibility', 'visible');
  361. }
  362. }
  363. });
  364. });
  365. </script>
  366. <script src=https://lib.baomitu.com/clipboard.js/2.0.11/clipboard.min.js></script>
  367. <script>Fluid.plugins.codeWidget();</script>
  368. <script>
  369. Fluid.utils.createScript('https://jscdn.limour.top/npm/anchor-js@4.3.1/anchor.min.js', function() { // Adds heading anchor links with anchor-js 4.3.1; the callback presumably runs after the script has loaded.
  370. window.anchors.options = { // Placement and visibility come from CONFIG.anchorjs.
  371. placement: CONFIG.anchorjs.placement,
  372. visible : CONFIG.anchorjs.visible
  373. };
  374. if (CONFIG.anchorjs.icon) { // Set a custom icon only when one is configured.
  375. window.anchors.options.icon = CONFIG.anchorjs.icon;
  376. }
  377. var el = (CONFIG.anchorjs.element || 'h1,h2,h3,h4,h5,h6').split(','); // Configured heading tags, falling back to h1-h6.
  378. var res = [];
  379. for (var item of el) {
  380. res.push('.markdown-body > ' + item.trim()); // Child combinator: only headings that are direct children of .markdown-body.
  381. }
  382. if (CONFIG.anchorjs.placement === 'left') { // Left-placed anchors get the extra class anchorjs-link-left.
  383. window.anchors.options.class = 'anchorjs-link-left';
  384. }
  385. window.anchors.add(res.join(', '));
  386. Fluid.events.registerRefreshCallback(function() { // Refresh hook: remove all anchors, then re-add them with the same selector-building steps as above.
  387. if ('anchors' in window) {
  388. anchors.removeAll();
  389. var el = (CONFIG.anchorjs.element || 'h1,h2,h3,h4,h5,h6').split(',');
  390. var res = [];
  391. for (var item of el) {
  392. res.push('.markdown-body > ' + item.trim());
  393. }
  394. if (CONFIG.anchorjs.placement === 'left') {
  395. anchors.options.class = 'anchorjs-link-left';
  396. }
  397. anchors.add(res.join(', '));
  398. }
  399. });
  400. });
  401. </script>
  402. <script>
  403. Fluid.utils.createScript('https://lib.baomitu.com/fancybox/3.5.7/jquery.fancybox.min.js', function() { // Loads fancybox 3.5.7; the callback presumably runs after the script has loaded.
  404. Fluid.plugins.fancyBox(); // Called with no selector here, unlike the Waline loader, which passes one for comment images.
  405. });
  406. </script>
  407. <script>Fluid.plugins.imageCaption();</script>
  408. <script src="/js/local-search.js" ></script>
  409. <!-- 主题的启动项,将它保持在最底部 -->
  410. <!-- the boot of the theme, keep it at the bottom -->
  411. <script src="/js/boot.js" ></script>
  412. <noscript>
  413. <div class="noscript-warning">Blog works best with JavaScript enabled</div>
  414. </noscript>
  415. <!-- hexo injector body_end start -->
  416. <script defer src="/theme-inject/timeliness.js"></script>
  417. <!-- hexo injector body_end end --></body>
  418. </html>