├── .gitignore
├── .vscode
│   └── settings.json
├── LICENCE
├── docker-compose.yml
├── fastapi
│   ├── .langchain.db
│   ├── Dockerfile
│   ├── app
│   │   ├── .env
│   │   ├── __pycache__
│   │   │   ├── main.cpython-310.pyc
│   │   │   ├── main.cpython-311.pyc
│   │   │   └── main.cpython-39.pyc
│   │   └── main.py
│   ├── gunicorn_conf.py
│   ├── requirements.txt
│   ├── start-reload.sh
│   ├── start.sh
│   └── submodules
│       ├── __pycache__
│       │   └── prompts.cpython-310.pyc
│       └── prompts.py
├── qdrant
│   └── Dockerfile
├── readme.md
└── sveltekit
    ├── .env
    ├── .gitignore
    ├── .npmrc
    ├── .prettierignore
    ├── .prettierrc
    ├── Dockerfile
    ├── README.md
    ├── package.json
    ├── playwright.config.ts
    ├── postcss.config.cjs
    ├── src
    │   ├── app.css
    │   ├── app.d.ts
    │   ├── app.html
    │   ├── hooks.server.ts
    │   ├── index.test.ts
    │   ├── lib
    │   │   ├── components
    │   │   │   ├── PrismJS.svelte
    │   │   │   ├── chatbot.svelte
    │   │   │   └── chatbotstream.svelte
    │   │   ├── conversationStore.ts
    │   │   └── streamStore.ts
    │   └── routes
    │       ├── +layout.server.ts
    │       ├── +layout.svelte
    │       ├── +page.server.ts
    │       ├── +page.svelte
    │       ├── api
    │       │   └── queryGPT
    │       │       └── +server.ts
    │       ├── collection
    │       │   └── [collection]
    │       │       ├── +page.server.ts
    │       │       └── +page.svelte
    │       ├── document
    │       │   └── [collection]
    │       │       ├── +page.server.ts
    │       │       └── +page.svelte
    │       └── robots.txt
    │           └── +server.ts
    ├── static
    │   ├── favicon.png
    │   └── profile-image.png
    ├── svelte.config.js
    ├── tailwind.config.cjs
    ├── tests
    │   └── test.ts
    ├── tsconfig.json
    └── vite.config.ts

--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
fastapi/__pycache__
sveltekit/.svelte-kit
sveltekit/node_modules
azure-devops-pipeline.yml
docker-pipeline.yml
fastapi/.env
fastapi/app/.env

--------------------------------------------------------------------------------
/.vscode/settings.json:
--------------------------------------------------------------------------------
{
	"python.formatting.provider": "black"
}

--------------------------------------------------------------------------------
/LICENCE:
--------------------------------------------------------------------------------
MIT License

Copyright (c) 2023 Dag Thomas Olsen

Permission is hereby granted, free of charge, to any person obtaining a copy
of this software and associated documentation files (the "Software"), to deal
in the Software without restriction, including without limitation the rights
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
copies of the Software, and to permit persons to whom the Software is
furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
--------------------------------------------------------------------------------
/docker-compose.yml:
--------------------------------------------------------------------------------
version: "3.9"
networks:
  app-tier:
    driver: bridge
services:
  fastapi:
    build: ./fastapi
    expose:
      - "5000"
    ports:
      - "5000:5000"
    environment:
      - QDRANT_HOST=qdrant
    depends_on:
      - qdrant
    networks:
      - app-tier
    volumes:
      - ./fastapi:/app:Z
  sveltekit:
    build: ./sveltekit
    ports:
      - 3000:3000
    networks:
      - app-tier
    depends_on:
      - fastapi
    volumes:
      - ./sveltekit:/app:Z
    environment:
      - VITE_BACKEND_URL=http://localhost:5000
  qdrant:
    build: ./qdrant
    ports:
      - 6333:6333
    volumes:
      - ./data/qdrant_storage:/qdrant/storage
    networks:
      - app-tier

volumes:
  app-qdrant-data:

--------------------------------------------------------------------------------
/fastapi/.langchain.db:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/dagthomas/LangchainComposeChatYourDocs/b13915a6e395b006ad67668c822ddef71b570b16/fastapi/.langchain.db
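--------------------------------------------------------------------------------
Example: smoke-testing the stack (editor's sketch, not a repository file)
--------------------------------------------------------------------------------
Once `docker compose up` is running, a quick check that all three services answer on
their published ports can save debugging time. A minimal sketch; it assumes the
default port mappings from docker-compose.yml above and that the `requests` package
is available on the host (it is not part of either service's dependencies):

import requests

# Host-side ports published in docker-compose.yml (assumed unchanged).
SERVICES = {
    "fastapi": "http://localhost:5000/",
    "sveltekit": "http://localhost:3000/",
    "qdrant": "http://localhost:6333/",
}

for name, url in SERVICES.items():
    try:
        response = requests.get(url, timeout=5)
        print(f"{name}: HTTP {response.status_code}")
    except requests.ConnectionError:
        print(f"{name}: not reachable at {url}")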
--------------------------------------------------------------------------------
/fastapi/Dockerfile:
--------------------------------------------------------------------------------
FROM python:3.10-slim

COPY requirements.txt /tmp/requirements.txt
RUN pip install --no-cache-dir -r /tmp/requirements.txt
RUN apt-get update && apt-get install -y --no-install-recommends libmagic1 && rm -rf /var/lib/apt/lists/*
COPY ./start.sh /start.sh
RUN chmod +x /start.sh

COPY ./gunicorn_conf.py /gunicorn_conf.py

COPY ./start-reload.sh /start-reload.sh
RUN chmod +x /start-reload.sh

COPY ./app /app
WORKDIR /app/

ENV PYTHONPATH=/app

EXPOSE 5000

# Run the start script; it will check for an /app/prestart.sh script (e.g.
# for migrations) and then start Gunicorn with Uvicorn.
CMD ["/start.sh"]

--------------------------------------------------------------------------------
/fastapi/app/.env:
--------------------------------------------------------------------------------
OPENAI_API_KEY = sk-xxx
AUTHORIZED_API_KEY = 5pBHDjr4bkNFc1xdqIMR6INLItKuPvZrf8zNdc6enlXqhy8qVO8YCYKRcdd
APIFY_API_TOKEN = apify_api_xxx

--------------------------------------------------------------------------------
/fastapi/app/__pycache__/main.cpython-310.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/dagthomas/LangchainComposeChatYourDocs/b13915a6e395b006ad67668c822ddef71b570b16/fastapi/app/__pycache__/main.cpython-310.pyc

--------------------------------------------------------------------------------
/fastapi/app/__pycache__/main.cpython-311.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/dagthomas/LangchainComposeChatYourDocs/b13915a6e395b006ad67668c822ddef71b570b16/fastapi/app/__pycache__/main.cpython-311.pyc

--------------------------------------------------------------------------------
/fastapi/app/__pycache__/main.cpython-39.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/dagthomas/LangchainComposeChatYourDocs/b13915a6e395b006ad67668c822ddef71b570b16/fastapi/app/__pycache__/main.cpython-39.pyc
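--------------------------------------------------------------------------------
Example: minting a fresh AUTHORIZED_API_KEY (editor's sketch, not a repository file)
--------------------------------------------------------------------------------
The AUTHORIZED_API_KEY in fastapi/app/.env above is the bearer token that every
protected endpoint in main.py checks, and this copy is committed to the repository,
so anyone deploying the project should generate their own. One way to do that
(the token length is an arbitrary choice):

import secrets

# Print a URL-safe random token to paste into fastapi/app/.env
print(f"AUTHORIZED_API_KEY={secrets.token_urlsafe(48)}")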
--------------------------------------------------------------------------------
/fastapi/app/main.py:
--------------------------------------------------------------------------------
import threading
import queue
import openai
import langchain
from dotenv import load_dotenv
from pydantic import BaseModel
from qdrant_client import QdrantClient
import logging
from typing import List
import urllib3
import os
import tempfile
import sys
import pandas as pd
import typing as t
from slugify import slugify

# custom
import submodules.prompts as prompts
from langchain.schema import HumanMessage, SystemMessage

from langchain.document_loaders.base import Document
from langchain.document_loaders import ApifyDatasetLoader
from langchain.cache import InMemoryCache
from langchain.document_loaders import WebBaseLoader
from langchain.chat_models import ChatOpenAI
from langchain.document_loaders.csv_loader import CSVLoader
from langchain.document_loaders import SRTLoader
from langchain.document_loaders import UnstructuredWordDocumentLoader
from langchain.document_loaders import UnstructuredEPubLoader
from langchain.document_loaders import UnstructuredPowerPointLoader
from langchain.document_loaders import PyPDFLoader
from langchain.vectorstores import Qdrant
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.embeddings.openai import OpenAIEmbeddings
from langchain.chains.qa_with_sources import load_qa_with_sources_chain
from langchain.callbacks.base import CallbackManager
from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler

from fastapi import FastAPI, Depends, HTTPException, status, UploadFile, File
from fastapi.security.http import HTTPAuthorizationCredentials, HTTPBearer
from fastapi.responses import StreamingResponse
from fastapi.security import OAuth2PasswordBearer
from fastapi.middleware.cors import CORSMiddleware


langchain.llm_cache = InMemoryCache()


load_dotenv()

OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
AUTHORIZED_API_KEY = os.getenv("AUTHORIZED_API_KEY")
# Default to an empty string so a missing token doesn't raise a TypeError
os.environ["APIFY_API_TOKEN"] = os.getenv("APIFY_API_TOKEN", "")
openai.api_key = OPENAI_API_KEY

# Inside Docker Compose the Qdrant service is reachable by its service name
host = os.getenv("QDRANT_HOST", "qdrant")
client = QdrantClient(host=host, prefer_grpc=True)

http = urllib3.PoolManager(cert_reqs="CERT_NONE", retries=False)
logging.captureWarnings(True)
get_bearer_token = HTTPBearer(auto_error=False)
# Bearer-token auth
oauth2_scheme = OAuth2PasswordBearer(tokenUrl="token")


class UnauthorizedMessage(BaseModel):
    detail: str = "Bearer token missing or unknown"


known_tokens = set([AUTHORIZED_API_KEY])


async def get_token(
    auth: t.Optional[HTTPAuthorizationCredentials] = Depends(get_bearer_token),
) -> str:
    # Simulate a database query to find a known token
    if auth is None or (token := auth.credentials) not in known_tokens:
        raise HTTPException(
            status_code=status.HTTP_401_UNAUTHORIZED,
            detail=UnauthorizedMessage().detail,
        )
    return token


# start app
app = FastAPI(
    title="LangChain Starter API",
)

origins = [
    "*",
]
app.add_middleware(
    CORSMiddleware,
    allow_origins=origins,
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)


@app.on_event("startup")
async def startup():
    print("Server Startup!")


class GPTQuery(BaseModel):
    prompt: str
    system_intel: str
    temperature: float


class Query(BaseModel):
    query: str
    collection: str


class Apify(BaseModel):
    dataset: str
    collection: str


class Collection(BaseModel):
    collection: str
    prompt: str
    temperature: float


class Webpage(BaseModel):
    url: str


class Webpages(BaseModel):
    urls: List[str]
    collection_name: str


@app.get("/")
async def read_root():
    message = (
        "Hello world! From FastAPI running on Uvicorn with Gunicorn. "
        f"Using Python {sys.version_info.major}.{sys.version_info.minor}"
    )
    return {"message": message}
# FastAPI endpoint for returning a list of collections
@app.get("/collections")
async def read_collections(token: str = Depends(get_token)):
    data = client.get_collections()
    return data.collections


@app.post("/documents")
async def similarity_search(item: Query, token: str = Depends(get_token)):
    qdrant = Qdrant(
        client, item.collection, embedding_function=OpenAIEmbeddings().embed_query
    )
    docs = qdrant.similarity_search_with_score(item.query)
    return docs


@app.post("/collections")
async def query_collection(item: Collection, token: str = Depends(get_token)):
    qdrant = Qdrant(
        client, item.collection, embedding_function=OpenAIEmbeddings().embed_query
    )
    docs = qdrant.similarity_search(item.prompt)
    llm = ChatOpenAI(temperature=item.temperature, model_name="gpt-3.5-turbo")
    # , metadata_keys=['source']
    chain = load_qa_with_sources_chain(llm, chain_type="stuff")
    result = chain(
        {"input_documents": docs, "question": item.prompt}, return_only_outputs=True
    )
    return result


loader_classes = {
    ".pdf": PyPDFLoader,
    ".xls": CSVLoader,
    ".xlsx": CSVLoader,
    ".csv": CSVLoader,
    ".epub": UnstructuredEPubLoader,
    ".pptx": UnstructuredPowerPointLoader,
    ".docx": UnstructuredWordDocumentLoader,
    ".txt": SRTLoader,
    ".srt": SRTLoader,
}


async def ingest_data(tmp_file, slug, file_type, chunk_size, chunk_overlap):
    if file_type not in loader_classes:
        return "Filetype not supported"
    loader_class = loader_classes[file_type]
    if loader_class == CSVLoader and file_type in (".xls", ".xlsx"):
        # Excel files are converted to CSV first so CSVLoader can read them
        excel = pd.read_excel(tmp_file)
        os.makedirs(f"./files/{AUTHORIZED_API_KEY}", exist_ok=True)
        csv_path = f"./files/{AUTHORIZED_API_KEY}/{slug}.csv"
        excel.to_csv(csv_path, index=None, header=True)
        loader = loader_class(csv_path)
    else:
        loader = loader_class(tmp_file)
    documents = loader.load()
    # cache the embeddings client across calls
    if not hasattr(ingest_data, "embeddings"):
        ingest_data.embeddings = OpenAIEmbeddings()
    text_splitter = RecursiveCharacterTextSplitter(
        chunk_size=chunk_size, chunk_overlap=chunk_overlap
    )
    docs = text_splitter.split_documents(documents)
    Qdrant.from_documents(
        docs, ingest_data.embeddings, host=host, collection_name=slug, prefer_grpc=True
    )
    return slug


@app.post("/upload")
async def upload_file(file: UploadFile = File(...), token: str = Depends(get_token)):
    with tempfile.NamedTemporaryFile(delete=False) as tmp_file:
        tmp_file.write(await file.read())
        tmp_file_path = tmp_file.name
    file_extension = os.path.splitext(file.filename)[1].lower()
    response = await ingest_data(
        tmp_file_path,
        slugify(os.path.splitext(file.filename)[0]),
        file_extension,
        chunk_size=256,
        chunk_overlap=40,
    )
    os.unlink(tmp_file_path)
    return response


@app.post("/webpage")
async def create_webpage(item: Webpage, token: str = Depends(get_token)):
    collection_name = slugify(item.url.split("/")[-1])
    loader = WebBaseLoader(item.url)
    documents = loader.load()
    text_splitter = RecursiveCharacterTextSplitter(chunk_size=250, chunk_overlap=40)
    docs = text_splitter.split_documents(documents)
    embeddings = OpenAIEmbeddings()
    Qdrant.from_documents(
        docs, embeddings, host=host, collection_name=collection_name, prefer_grpc=True
    )
    return collection_name
@app.post("/webpages")
async def create_webpages(item: Webpages, token: str = Depends(get_token)):
    loader = WebBaseLoader(item.urls)
    documents = loader.load()
    text_splitter = RecursiveCharacterTextSplitter(chunk_size=250, chunk_overlap=40)
    docs = text_splitter.split_documents(documents)
    embeddings = OpenAIEmbeddings()
    Qdrant.from_documents(
        docs,
        embeddings,
        host=host,
        collection_name=item.collection_name,
        prefer_grpc=True,
    )

    return item.collection_name


@app.post("/openai")
async def openai_query(item: GPTQuery, token: str = Depends(get_token)):
    system_intel = item.system_intel
    prompt = item.prompt
    result = openai.ChatCompletion.create(
        model="gpt-3.5-turbo",
        temperature=item.temperature,
        messages=[
            {"role": "system", "content": system_intel},
            {"role": "user", "content": prompt},
        ],
    )

    return result.choices[0].message.content


@app.post("/apify")
async def ingest_apify_dataset(item: Apify, token: str = Depends(get_token)):
    loader = ApifyDatasetLoader(
        dataset_id=item.dataset,
        dataset_mapping_function=lambda dataset_item: Document(
            page_content=dataset_item["aml_text"],
            metadata={
                "source": dataset_item["url"],
                "title": dataset_item["aml_title"],
                "paragraph": dataset_item["paragraph"],
            },
        ),
    )
    embeddings = OpenAIEmbeddings()
    documents = loader.load()
    if not documents:
        return item.collection

    text_splitter = RecursiveCharacterTextSplitter(
        chunk_size=1000, chunk_overlap=200, length_function=len
    )
    # Index the dataset in batches of 50 documents to keep requests small
    n = 50
    batches = [
        documents[i * n : (i + 1) * n] for i in range((len(documents) + n - 1) // n)
    ]
    docs = text_splitter.split_documents(batches[0])
    qdrant = Qdrant.from_documents(
        docs, embeddings, host=host, collection_name=item.collection
    )
    for batch in batches[1:]:
        split_batch = text_splitter.split_documents(batch)
        if split_batch:
            qdrant.add_documents(split_batch)

    return item.collection


class ThreadedGenerator:
    """Queue-backed generator: the LLM thread feeds tokens in,
    and the StreamingResponse iterates them out."""

    def __init__(self):
        self.queue = queue.Queue()

    def __iter__(self):
        return self

    def __next__(self):
        item = self.queue.get()
        if item is StopIteration:
            raise item
        return item

    def send(self, data):
        self.queue.put(data)

    def close(self):
        self.queue.put(StopIteration)


class ChainStreamHandler(StreamingStdOutCallbackHandler):
    def __init__(self, gen):
        super().__init__()
        self.gen = gen

    def on_llm_new_token(self, token: str, **kwargs):
        self.gen.send(token)


def llm_thread(g, prompt, system_intel, temperature):
    try:
        chat = ChatOpenAI(
            model_name="gpt-3.5-turbo",
            verbose=True,
            streaming=True,
            callback_manager=CallbackManager([ChainStreamHandler(g)]),
            temperature=temperature,
        )

        chat([SystemMessage(content=system_intel), HumanMessage(content=prompt)])

    finally:
        g.close()
def chat(prompt, system_intel, temperature):
    g = ThreadedGenerator()
    threading.Thread(
        target=llm_thread, args=(g, prompt, system_intel, temperature)
    ).start()
    return g


@app.post("/openai/stream")
async def openai_stream(item: GPTQuery, token: str = Depends(get_token)):
    return StreamingResponse(
        chat(item.prompt, item.system_intel, item.temperature),
        media_type="text/event-stream",
    )


@app.post("/collections/stream")
async def collections_stream(item: Collection, token: str = Depends(get_token)):
    qdrant = Qdrant(
        client, item.collection, embedding_function=OpenAIEmbeddings().embed_query
    )
    retriever = qdrant.as_retriever(search_type="similarity")
    relevant_docs = retriever.get_relevant_documents(item.prompt)
    template = prompts.documentSearch(item.prompt, relevant_docs)
    return StreamingResponse(
        chat(item.prompt, template, item.temperature), media_type="text/event-stream"
    )

--------------------------------------------------------------------------------
/fastapi/gunicorn_conf.py:
--------------------------------------------------------------------------------
import json
import multiprocessing
import os

workers_per_core_str = os.getenv("WORKERS_PER_CORE", "1")
max_workers_str = os.getenv("MAX_WORKERS")
use_max_workers = None
if max_workers_str:
    use_max_workers = int(max_workers_str)
web_concurrency_str = os.getenv("WEB_CONCURRENCY", None)

host = os.getenv("HOST", "0.0.0.0")
port = os.getenv("PORT", "5000")
bind_env = os.getenv("BIND", None)
use_loglevel = os.getenv("LOG_LEVEL", "info")
if bind_env:
    use_bind = bind_env
else:
    use_bind = f"{host}:{port}"

cores = multiprocessing.cpu_count()
workers_per_core = float(workers_per_core_str)
default_web_concurrency = workers_per_core * cores
if web_concurrency_str:
    web_concurrency = int(web_concurrency_str)
    assert web_concurrency > 0
else:
    web_concurrency = max(int(default_web_concurrency), 2)
    if use_max_workers:
        web_concurrency = min(web_concurrency, use_max_workers)
accesslog_var = os.getenv("ACCESS_LOG", "-")
use_accesslog = accesslog_var or None
errorlog_var = os.getenv("ERROR_LOG", "-")
use_errorlog = errorlog_var or None
graceful_timeout_str = os.getenv("GRACEFUL_TIMEOUT", "120")
timeout_str = os.getenv("TIMEOUT", "120")
keepalive_str = os.getenv("KEEP_ALIVE", "5")

# Gunicorn config variables
loglevel = use_loglevel
# workers = web_concurrency
# threads = web_concurrency
workers = 4
threads = 4
worker_connections = 1000
bind = use_bind
errorlog = use_errorlog
worker_tmp_dir = "/dev/shm"
accesslog = use_accesslog
graceful_timeout = int(graceful_timeout_str)
timeout = int(timeout_str)
keepalive = int(keepalive_str)

# For debugging and testing
log_data = {
    "loglevel": loglevel,
    "workers": workers,
    "threads": threads,
    "worker_connections": worker_connections,
    "bind": bind,
    "graceful_timeout": graceful_timeout,
    "timeout": timeout,
    "keepalive": keepalive,
    "errorlog": errorlog,
    "accesslog": accesslog,
    # Additional, non-gunicorn variables
    "workers_per_core": workers_per_core,
    "use_max_workers": use_max_workers,
    "host": host,
    "port": port,
}
print(json.dumps(log_data))
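--------------------------------------------------------------------------------
Example: consuming a streaming endpoint (editor's sketch, not a repository file)
--------------------------------------------------------------------------------
The /openai/stream and /collections/stream endpoints above return chunked
responses labelled text/event-stream, but the body is the raw token stream fed
through the ThreadedGenerator, not framed SSE events. A minimal client sketch; it
assumes the API is reachable on localhost:5000 (the docker-compose.yml mapping),
that `requests` is installed, and that the token matches AUTHORIZED_API_KEY from
fastapi/app/.env:

import requests

API_URL = "http://localhost:5000/openai/stream"
TOKEN = "5pBHDjr4bkNFc1xdqIMR6INLItKuPvZrf8zNdc6enlXqhy8qVO8YCYKRcdd"

payload = {
    "prompt": "Summarize what a vector database does.",
    "system_intel": "You are a helpful assistant.",
    "temperature": 0.2,
}

with requests.post(
    API_URL,
    json=payload,
    headers={"Authorization": f"Bearer {TOKEN}"},
    stream=True,
) as response:
    response.raise_for_status()
    # Tokens arrive as bare chunks, so print them as they come in.
    for chunk in response.iter_content(chunk_size=None, decode_unicode=True):
        print(chunk, end="", flush=True)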
--------------------------------------------------------------------------------
/fastapi/requirements.txt:
--------------------------------------------------------------------------------
uvicorn[standard]==0.20.0
gunicorn==20.1.0
fastapi>=0.89.1
langchain==0.0.153
openai>=0.27.1
qdrant_client>=0.1.0
python-multipart>=0.0.6
pypdf>=1.26.0
pyodc>=0.0.1
python-slugify>=5.0.2
pandas>=1.3.3
python-magic>=0.4.24
bs4>=0.0.1
transformers>=4.11.3
openpyxl>=3.0.9
aiofiles>=0.7.0
asyncio>=3.4.3
unstructured>=0.0.1
aiohttp>=3.7.4.post0
pysrt>=1.1.2
sseclient>=0.0.27
pycryptodome>=3.15.0
apify-client>=0.5.20
tiktoken>=0.0.1
nltk>=3.6.5
spacy>=3.1.4

--------------------------------------------------------------------------------
/fastapi/start-reload.sh:
--------------------------------------------------------------------------------
#! /usr/bin/env sh
set -e

if [ -f /app/app/main.py ]; then
    DEFAULT_MODULE_NAME=app.main
elif [ -f /app/main.py ]; then
    DEFAULT_MODULE_NAME=main
fi
MODULE_NAME=${MODULE_NAME:-$DEFAULT_MODULE_NAME}
VARIABLE_NAME=${VARIABLE_NAME:-app}
export APP_MODULE=${APP_MODULE:-"$MODULE_NAME:$VARIABLE_NAME"}

HOST=${HOST:-0.0.0.0}
PORT=${PORT:-5000}
LOG_LEVEL=${LOG_LEVEL:-info}

exec uvicorn --reload --host $HOST --port $PORT --log-level $LOG_LEVEL "$APP_MODULE"

--------------------------------------------------------------------------------
/fastapi/start.sh:
--------------------------------------------------------------------------------
#! /usr/bin/env sh
set -e

if [ -f /app/app/main.py ]; then
    DEFAULT_MODULE_NAME=app.main
elif [ -f /app/main.py ]; then
    DEFAULT_MODULE_NAME=main
fi
MODULE_NAME=${MODULE_NAME:-$DEFAULT_MODULE_NAME}
VARIABLE_NAME=${VARIABLE_NAME:-app}
export APP_MODULE=${APP_MODULE:-"$MODULE_NAME:$VARIABLE_NAME"}

if [ -f /app/gunicorn_conf.py ]; then
    DEFAULT_GUNICORN_CONF=/app/gunicorn_conf.py
elif [ -f /app/app/gunicorn_conf.py ]; then
    DEFAULT_GUNICORN_CONF=/app/app/gunicorn_conf.py
else
    DEFAULT_GUNICORN_CONF=/gunicorn_conf.py
fi
export GUNICORN_CONF=${GUNICORN_CONF:-$DEFAULT_GUNICORN_CONF}
export WORKER_CLASS=${WORKER_CLASS:-"uvicorn.workers.UvicornWorker"}

# Start Gunicorn
exec gunicorn -k "$WORKER_CLASS" --timeout 360 -c "$GUNICORN_CONF" "$APP_MODULE"

# exec gunicorn -k gevent --timeout 120 --workers=3 --threads=3 --worker-connections=1000 "$APP_MODULE" --log-level debug

--------------------------------------------------------------------------------
/fastapi/submodules/__pycache__/prompts.cpython-310.pyc:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/dagthomas/LangchainComposeChatYourDocs/b13915a6e395b006ad67668c822ddef71b570b16/fastapi/submodules/__pycache__/prompts.cpython-310.pyc

--------------------------------------------------------------------------------
/fastapi/submodules/prompts.py:
--------------------------------------------------------------------------------
def documentSearch(prompt, docs):
    template = f"""You are given extracted parts of a long document and a question. Create a final answer with references.
If you don't know the answer, just say that you don't know; don't try to make up an answer.
If you know the answer, ALWAYS return the sources in the answer.
Identify the language of the question and reply in the identified language. Do not output the identified language.
=========
QUESTION: {prompt}
=========
CONTENT: {docs}
=========
FINAL ANSWER:"""
    return template
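--------------------------------------------------------------------------------
Example: what documentSearch renders (editor's sketch, not a repository file)
--------------------------------------------------------------------------------
documentSearch is called from /collections/stream in main.py with the raw list of
retrieved Document objects, so the CONTENT block of the template contains their
Python repr (page_content plus metadata), which is how the model sees the source
URLs it is told to cite. A sketch with an invented document standing in for the
retriever output:

from langchain.document_loaders.base import Document

from submodules.prompts import documentSearch

# A hypothetical retrieved chunk, standing in for retriever.get_relevant_documents(...)
docs = [
    Document(
        page_content="Qdrant is a vector similarity search engine.",
        metadata={"source": "https://qdrant.tech"},
    )
]
print(documentSearch("What is Qdrant?", docs))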
--------------------------------------------------------------------------------
/qdrant/Dockerfile:
--------------------------------------------------------------------------------
FROM qdrant/qdrant

--------------------------------------------------------------------------------
/readme.md:
--------------------------------------------------------------------------------
# LangchainComposeChatYourDocs

A FastAPI, Qdrant, LangChain and SvelteKit starter project with some cool features.

## Project Description

The purpose is to learn, and to help others along the way.

## Installation and Setup

1. Rename /fastapi/app/.env.example to .env and fill in your OpenAI API key.
2. Make sure Docker Desktop is installed.
3. Run `docker compose up`.
4. Go to http://localhost:3000.

## Usage

From the start page, upload a file, a single webpage, or a list of webpages to index, then chat with the indexed content.

https://www.youtube.com/watch?v=tnB5jOdsPqM

--------------------------------------------------------------------------------
/sveltekit/.env:
--------------------------------------------------------------------------------
BODY_SIZE_LIMIT = 0
VITE_BASE_URL=http://localhost:5000
VITE_BASE_FASTAPI_URL=http://fastapi:5000
VITE_BEARER_TOKEN=5pBHDjr4bkNFc1xdqIMR6INLItKuPvZrf8zNdc6enlXqhy8qVO8YCYKRcdd

--------------------------------------------------------------------------------
/sveltekit/.gitignore:
--------------------------------------------------------------------------------
.DS_Store
node_modules
/build
/.svelte-kit
/package
!.env.example
vite.config.js.timestamp-*
vite.config.ts.timestamp-*

--------------------------------------------------------------------------------
/sveltekit/.npmrc:
--------------------------------------------------------------------------------
engine-strict=true

--------------------------------------------------------------------------------
/sveltekit/.prettierignore:
--------------------------------------------------------------------------------
.DS_Store
node_modules
/build
/.svelte-kit
/package
.env
.env.*
!.env.example

# Ignore files for PNPM, NPM and YARN
pnpm-lock.yaml
package-lock.json
yarn.lock

--------------------------------------------------------------------------------
/sveltekit/.prettierrc:
--------------------------------------------------------------------------------
{
	"useTabs": true,
	"singleQuote": true,
	"trailingComma": "none",
	"printWidth": 100,
	"plugins": ["prettier-plugin-svelte"],
	"pluginSearchDirs": ["."],
	"overrides": [{ "files": "*.svelte", "options": { "parser": "svelte" } }]
}
--------------------------------------------------------------------------------
/sveltekit/Dockerfile:
--------------------------------------------------------------------------------
FROM node:16-bullseye-slim AS BUILDER
LABEL dockerfile.baseimage="node:16-bullseye-slim" dockerfile.description="LearningLibrary Build Container" dockerfile.stage="BUILDER"
ENV NODE_ENV development
ENV BODY_SIZE_LIMIT=0
ENV ORIGIN=http://localhost:3000
WORKDIR /usr/src/app
COPY package.json tsconfig.json ./
RUN npm i
COPY . /usr/src/app
RUN npm run build && npm prune --omit=dev

FROM gcr.io/distroless/nodejs:16

LABEL dockerfile.baseimage="gcr.io/distroless/nodejs:16" dockerfile.description="LearningLibrary Production Container" dockerfile.stage="PRODUCTION"
ENV NODE_ENV production
ENV BODY_SIZE_LIMIT=0
ENV ORIGIN=http://localhost:3000
WORKDIR /usr/src/app
COPY --from=BUILDER /usr/src/app/build ./build
COPY --from=BUILDER /usr/src/app/node_modules ./node_modules
COPY package.json .

EXPOSE 3000
CMD ["build"]

--------------------------------------------------------------------------------
/sveltekit/README.md:
--------------------------------------------------------------------------------
# create-svelte

Everything you need to build a Svelte project, powered by [`create-svelte`](https://github.com/sveltejs/kit/tree/master/packages/create-svelte).

## Creating a project

If you're seeing this, you've probably already done this step. Congrats!

```bash
# create a new project in the current directory
npm create svelte@latest

# create a new project in my-app
npm create svelte@latest my-app
```

## Developing

Once you've created a project and installed dependencies with `npm install` (or `pnpm install` or `yarn`), start a development server:

```bash
npm run dev

# or start the server and open the app in a new browser tab
npm run dev -- --open
```

## Building

To create a production version of your app:

```bash
npm run build
```

You can preview the production build with `npm run preview`.

> To deploy your app, you may need to install an [adapter](https://kit.svelte.dev/docs/adapters) for your target environment.

--------------------------------------------------------------------------------
/sveltekit/package.json:
--------------------------------------------------------------------------------
{
	"name": "sveltekit",
	"version": "0.0.1",
	"private": true,
	"scripts": {
		"dev": "vite dev",
		"build": "BODY_SIZE_LIMIT=20000000 vite build",
		"preview": "vite preview",
		"test": "playwright test",
		"check": "svelte-kit sync && svelte-check --tsconfig ./tsconfig.json",
		"check:watch": "svelte-kit sync && svelte-check --tsconfig ./tsconfig.json --watch",
		"test:unit": "vitest",
		"lint": "prettier --plugin-search-dir . --check .",
		"format": "prettier --plugin-search-dir . --write ."
	},
	"devDependencies": {
		"@playwright/test": "^1.28.1",
		"@sveltejs/adapter-node": "^1.2.4",
		"@sveltejs/kit": "^1.15.10",
		"autoprefixer": "^10.4.13",
		"postcss": "^8.4.21",
		"prettier": "^2.8.0",
		"prettier-plugin-svelte": "^2.8.1",
		"svelte": "^3.58.0",
		"svelte-check": "^3.0.1",
		"tailwindcss": "^3.3.1",
		"tslib": "^2.4.1",
		"typescript": "^4.9.3",
		"vite": "^4.3.4",
		"vitest": "^0.25.3"
	},
	"type": "module",
	"dependencies": {
		"@auth/core": "^0.5.1",
		"@auth/sveltekit": "^0.3.0",
		"@fontsource/poppins": "^4.5.10",
		"daisyui": "^2.51.5",
		"dotenv": "^16.0.3",
		"openai": "^3.2.1"
	}
}
--------------------------------------------------------------------------------
/sveltekit/playwright.config.ts:
--------------------------------------------------------------------------------
import type { PlaywrightTestConfig } from '@playwright/test';

const config: PlaywrightTestConfig = {
	webServer: {
		command: 'npm run build && npm run preview',
		port: 4173
	},
	testDir: 'tests'
};

export default config;

--------------------------------------------------------------------------------
/sveltekit/postcss.config.cjs:
--------------------------------------------------------------------------------
module.exports = {
	plugins: {
		tailwindcss: {},
		autoprefixer: {}
	}
};

--------------------------------------------------------------------------------
/sveltekit/src/app.css:
--------------------------------------------------------------------------------
@tailwind base;
@tailwind components;
@tailwind utilities;

* {
	scrollbar-color: rgb(195, 60, 102) #061E30;
}

*::-webkit-scrollbar {
	width: 5px;
}

/* Track */
*::-webkit-scrollbar-track {
	background: #061E30;
}

*::-webkit-scrollbar-thumb {
	background: rgb(195, 60, 102);
}

--------------------------------------------------------------------------------
/sveltekit/src/app.d.ts:
--------------------------------------------------------------------------------
// See https://kit.svelte.dev/docs/types#app
// for information about these interfaces
declare global {
	namespace App {
		// interface Error {}
		// interface Locals {}
		// interface PageData {}
		// interface Platform {}
	}
}

export {};
--------------------------------------------------------------------------------
/sveltekit/src/app.html (and remaining SvelteKit sources):
--------------------------------------------------------------------------------
[The rest of the SvelteKit sources (app.html, hooks.server.ts, index.test.ts, the
lib/ components and stores, the routes/ tree, svelte.config.js, tailwind.config.cjs,
tests/test.ts, tsconfig.json and vite.config.ts) were garbled in this export: their
markup was stripped, leaving only scattered line numbers and bare text nodes. The
surviving fragments are the %sveltekit.head% placeholder from app.html, the {code}
slot from PrismJS.svelte, the supported-upload list ".PDF, .CSV, .EPUB, .PPTX,
.DOCX, .XLSX, .SRT", and the input labels "Enter URL to index body text" /
"Enter URLs to index body text" from the chatbot components.]
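--------------------------------------------------------------------------------
Example: upload-and-ask flow (editor's sketch, not a repository file)
--------------------------------------------------------------------------------
The chatbot components listed above drove the /upload and /collections/stream
endpoints from fastapi/app/main.py. The same flow can be scripted; this sketch
assumes the stack is running on localhost:5000, that `requests` is installed,
that a file named example.pdf exists (any supported type works), and that the
bearer token is the one from sveltekit/.env:

import requests

BASE_URL = "http://localhost:5000"
HEADERS = {
    "Authorization": "Bearer 5pBHDjr4bkNFc1xdqIMR6INLItKuPvZrf8zNdc6enlXqhy8qVO8YCYKRcdd"
}

# 1. Upload a document; /upload answers with the slugified collection name.
with open("example.pdf", "rb") as f:  # hypothetical file, standing in for a real upload
    collection = requests.post(
        f"{BASE_URL}/upload", headers=HEADERS, files={"file": f}
    ).json()

# 2. Ask a question against that collection and stream the answer.
with requests.post(
    f"{BASE_URL}/collections/stream",
    headers=HEADERS,
    json={
        "collection": collection,
        "prompt": "What is this document about?",
        "temperature": 0.0,
    },
    stream=True,
) as response:
    for chunk in response.iter_content(chunk_size=None, decode_unicode=True):
        print(chunk, end="", flush=True)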