From 8d1989b7285a6324800b55d221124b572a165282 Mon Sep 17 00:00:00 2001
From: ydennisy
Date: Sun, 24 Mar 2024 17:00:37 +0000
Subject: [PATCH] chore: split all RUN commands to debug build step

---
Review notes (this area between the `---` separator and the first
`diff --git` line is ignored by `git am`):

* Every RUN instruction is passed to the shell as its own complete command,
  so none of the split steps may end with a dangling `&&`. The two trailing
  `&&` left over from the former single chained command have been removed
  from the added lines.
* The abbreviated post-image blob id on the `index` line below was not
  recomputed after that correction.

 backend/Dockerfile        | 10 +++---
 urls.txt => docs/urls.txt |  0
 scratch.md                | 57 ---------------------------------------
 3 files changed, 5 insertions(+), 62 deletions(-)
 rename urls.txt => docs/urls.txt (100%)
 delete mode 100644 scratch.md

diff --git a/backend/Dockerfile b/backend/Dockerfile
index f425e12..52652bb 100644
--- a/backend/Dockerfile
+++ b/backend/Dockerfile
@@ -7,10 +7,10 @@ WORKDIR /app
 
 COPY . ./
 
-RUN pip install --no-cache-dir torch==2.0.1 --index-url https://download.pytorch.org/whl/cpu && \
-    pip install --no-cache-dir pipenv==2023.12.1 \
-    pipenv requirements > requirements.txt \
-    pip install --no-cache-dir -r requirements.txt && \
-    python -c 'from sentence_transformers import SentenceTransformer; SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2", cache_folder="./app/artefacts")'
+RUN pip install --no-cache-dir torch==2.0.1 --index-url https://download.pytorch.org/whl/cpu
+RUN pip install --no-cache-dir pipenv==2023.12.1
+RUN pipenv requirements > requirements.txt
+RUN pip install --no-cache-dir -r requirements.txt
+RUN python -c 'from sentence_transformers import SentenceTransformer; SentenceTransformer("sentence-transformers/all-MiniLM-L6-v2", cache_folder="./app/artefacts")'
 
 CMD exec uvicorn app.main:app --host $HOST --port $PORT --workers 2
diff --git a/urls.txt b/docs/urls.txt
similarity index 100%
rename from urls.txt
rename to docs/urls.txt
diff --git a/scratch.md b/scratch.md
deleted file mode 100644
index 155ac38..0000000
--- a/scratch.md
+++ /dev/null
@@ -1,57 +0,0 @@
-# Scratch
-
-This is a page to throw ideas, refs, etc and delete as soon as possible.
-
-## ideas
-
-- check out ra-dit paper, and its references
-- we can have kg1 run locally, so all data is local, but a ActivityPub stream has things published and displayed centrally
-- this would be a nice local + social
-- would also allow to use DBs locally cheaper.
-
-## references
-
-- https://github.com/pgvector/pgvector-node#prisma
-- https://github.com/langchain-ai/langchainjs/blob/54d9f92/langchain/src/vectorstores/prisma.ts#L130
-- https://supabase.com/docs/guides/ai
-- https://supabase.com/blog/hugging-face-supabase
-- https://supabase.com/partners/integrations/prisma
-- https://supabase.com/blog/openai-embeddings-postgres-vector
-- https://github.com/withastro/astro/blob/main/packages/markdown/remark/package.json
-- https://github.com/remarkjs/remark#example-support-for-gfm-and-frontmatter
-- https://github.com/remarkjs/remark-frontmatter/blob/main/lib/index.js
-
-## inspiration
-
-- [SeaGOAT](https://github.com/kantord/SeaGOAT)
-- [lotion](https://github.com/Dashibase/lotion)
-- [danswer](https://github.com/danswer-ai/danswer)
-- [llm-app](https://github.com/pathwaycom/llm-app)
-- [llama-index](https://ts.llamaindex.ai/)
-- [lang-chain](https://js.langchain.com/docs/get_started/introduction)
-- [Yacy](https://github.com/yacy/yacy_search_server)
-- [Verba](https://github.com/weaviate/Verba)
-- [ArchiveBox](https://github.com/ArchiveBox/ArchiveBox)
-- [PageFind](https://github.com/CloudCannon/pagefind)
-- [HPI](https://github.com/karlicoss/HPI)
-
-- https://github.com/ray-project/llm-applications/blob/main/notebooks/rag.ipynb
-- https://github.com/supabase/vecs
-- https://github.com/igorbenav/fastcrud
-- https://github.com/Kludex/fastapi-microservices
-- https://github.com/tiangolo/full-stack-fastapi-postgresql/
-- https://github.com/nuxt/hackernews/blob/master/layouts/default.vue
-
-todo:
-
-- add an admin flow, for different chunking (rechunking) strategies
-- use a google like UI for search
-- create a extension which allows to index from a right click in the browser - bitwarden extension has this.
-
-refs:
-
-- https://kuzudb.com/docusaurus/blog/llms-graphs-part-2/
-
-LOOK!!!!!!
-
-- https://www.askmarvin.ai/docs/interactive/assistants/