seanpedrickcase committed on
Commit
49e0db8
1 Parent(s): 08eb30d

Added and replaced relevant files to download in download_model.py to allow for app use on AWS

Browse files
Files changed (2) hide show
  1. Dockerfile +2 -2
  2. download_model.py +10 -3
Dockerfile CHANGED
@@ -2,7 +2,7 @@
2
  FROM public.ecr.aws/docker/library/python:3.11.9-slim-bookworm AS builder
3
 
4
  # Install Lambda web adapter in case you want to run with an AWS Lambda function URL (not essential if not using Lambda)
5
- #COPY --from=public.ecr.aws/awsguru/aws-lambda-adapter:0.8.3 /lambda-adapter /opt/extensions/lambda-adapter
6
 
7
  # Install system dependencies
8
  RUN apt-get update && rm -rf /var/lib/apt/lists/*
@@ -15,7 +15,7 @@ WORKDIR /src
15
  # Copy requirements file and install dependencies. Sentence transformers and Bertopic are installed without dependencies so that torch is not reinstalled.
16
  COPY requirements_aws.txt .
17
 
18
- RUN pip install torch==2.4.0+cpu --target=/install --index-url https://download.pytorch.org/whl/cpu \
19
  && pip install --no-cache-dir --target=/install sentence-transformers==3.2.0 --no-deps \
20
  && pip install --no-cache-dir --target=/install bertopic==0.16.4 --no-deps \
21
  && pip install --no-cache-dir --target=/install -r requirements_aws.txt \
 
2
  FROM public.ecr.aws/docker/library/python:3.11.9-slim-bookworm AS builder
3
 
4
  # Install Lambda web adapter in case you want to run with an AWS Lambda function URL (not essential if not using Lambda)
5
+ #COPY --from=public.ecr.aws/awsguru/aws-lambda-adapter:0.8.4 /lambda-adapter /opt/extensions/lambda-adapter
6
 
7
  # Install system dependencies
8
  RUN apt-get update && rm -rf /var/lib/apt/lists/*
 
15
  # Copy requirements file and install dependencies. Sentence transformers and Bertopic are installed without dependencies so that torch is not reinstalled.
16
  COPY requirements_aws.txt .
17
 
18
+ RUN pip install torch==2.5.1+cpu --target=/install --index-url https://download.pytorch.org/whl/cpu \
19
  && pip install --no-cache-dir --target=/install sentence-transformers==3.2.0 --no-deps \
20
  && pip install --no-cache-dir --target=/install bertopic==0.16.4 --no-deps \
21
  && pip install --no-cache-dir --target=/install -r requirements_aws.txt \
download_model.py CHANGED
@@ -1,15 +1,22 @@
1
  from huggingface_hub import hf_hub_download
2
 
3
  # Define the repository and files to download
4
- repo_id = "mixedbread-ai/mxbai-embed-xsmall-v1" #"sentence-transformers/all-MiniLM-L6-v2" #"BAAI/bge-small-en-v1.5"
5
  files_to_download = [
6
  "config.json",
7
- "pytorch_model.bin",
 
 
 
 
 
8
  "tokenizer_config.json",
9
  "vocab.txt"
10
  ]
11
 
 
 
12
  # Download each file and save it to the /model/embed directory
13
  for file_name in files_to_download:
14
  print("Checking for file", file_name)
15
- hf_hub_download(repo_id=repo_id, filename=file_name, local_dir="/model/embed") #"/model/bge"
 
1
  from huggingface_hub import hf_hub_download
2
 
3
  # Define the repository and files to download
4
+ repo_id = "mixedbread-ai/mxbai-embed-xsmall-v1" #"sentence-transformers/all-MiniLM-L6-v2"
5
  files_to_download = [
6
  "config.json",
7
+ "config_sentence_transformers.json",
8
+ "model.safetensors",
9
+ "tokenizer.json",
10
+ "special_tokens_map.json",
11
+ "angle_config.json",
12
+ "modules.json",
13
  "tokenizer_config.json",
14
  "vocab.txt"
15
  ]
16
 
17
+ #"pytorch_model.bin",
18
+
19
  # Download each file and save it to the /model/embed directory
20
  for file_name in files_to_download:
21
  print("Checking for file", file_name)
22
+ hf_hub_download(repo_id=repo_id, filename=file_name, local_dir="/model/embed")