Spaces:

Sunbird
/

acres

Starting

App Files Files Community

Add zotero manager

by patrickcmd - opened Sep 11, 2024

base: refs/heads/main

←

from: refs/pr/1

Discussion Files changed

+266

-7317

This view is limited to 50 files because it contains too many changes. See the raw diff here.

Files changed (50) hide show

.dockerignore +0 -13
.env.example +0 -6
.flake8 +0 -5
.gitattributes +0 -1
.gitignore +0 -187
.gradio/certificate.pem +0 -31
.isort.cfg +0 -7
Dockerfile.api +0 -19
Dockerfile.api.prod +0 -72
Dockerfile.gradio +0 -21
Dockerfile.gradio.prod +0 -72
Makefile +0 -12
README.md +2 -230
__pycache__/config.cpython-311.pyc +0 -0
api.py +0 -134
app.py +69 -654
bin/cfn/ecs-delete +0 -14
bin/cfn/ecs-deploy +0 -25
bin/cfn/ecs-deploy-update-api +0 -22
bin/cfn/ecs-deploy-update-gradio +0 -22
commands.md +0 -53
config.py +5 -10
config/pdf_config.yaml +0 -0
data/.keep +0 -0
data/ebola_virus_zotero_items.json +17 -17
data/ebscohost_zotero_items.json +0 -0
data/exportedris-file-1-of-1-1_zotero_items.json +0 -813
data/gene_xpert_zotero_items.json +31 -31
data/kayongo-papers_zotero_items.json +0 -222
data/vaccine_coverage_zotero_items.json +18 -18
data/zotero-collection-pastan_zotero_items.json +0 -0
docs.py +0 -13
infra/ecs_config.template +0 -7
infra/ecs_fargate.yml +0 -581
interface.py +0 -47
pyproject.toml +0 -19
rag/__pycache__/__init__.cpython-311.pyc +0 -0
rag/__pycache__/rag_pipeline.cpython-311.pyc +0 -0
rag/rag_pipeline.py +53 -164
rag/rag_pipeline_backup.py +0 -93
requirements-dev.txt +0 -3
requirements.txt +6 -25
sample_queries.md +0 -2
study_files.json +0 -13
utils/__pycache__/__init__.cpython-311.pyc +0 -0
utils/__pycache__/prompts.cpython-311.pyc +0 -0
utils/db.py +0 -3
utils/helpers.py +29 -234
utils/pdf_processor.py +0 -222
utils/prompts.py +36 -33

.dockerignore DELETED Viewed

@@ -1,13 +0,0 @@
-**/.git
-**/.gitignore
-**/.vscode
-**/coverage
-**/.aws
-**/.ssh
-**/.terraform
-Dockerfile
-README.md
-docker-compose.yml
-**/.DS_Store
-**/venv
-**/env

.env.example DELETED Viewed

@@ -1,6 +0,0 @@
-OPENAI_API_KEY=sk-xxxxxxxxxxxxxxxx
-HF_TOKEN_PATRICK=hf_xxxxxxxxxxxxxxxxx
-ZOTERO_LIBRARY_ID=1120xxxx
-ZOTERO_API_ACCESS_KEY=Ky5RGxxxxxxxxxxxxxxxxxx
-GRADIO_URL_=http://gradio:7860/

.flake8 DELETED Viewed

@@ -1,5 +0,0 @@
-[flake8]
-    ignore = D203, E402, F403, F405, W503, W605
-    exclude = .git,env,__pycache__,docs/source/conf.py,old,build,dist, *migrations*,env,venv,alembic
-    max-complexity = 10
-    max-line-length = 119

.gitattributes CHANGED Viewed

@@ -36,4 +36,3 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *db* filter=lfs diff=lfs merge=lfs -text
 vaccine_coverage_study.db filter=lfs diff=lfs merge=lfs -text
 *.db filter=lfs diff=lfs merge=lfs -text
-*.pdf filter=lfs diff=lfs merge=lfs -text

 *db* filter=lfs diff=lfs merge=lfs -text
 vaccine_coverage_study.db filter=lfs diff=lfs merge=lfs -text
 *.db filter=lfs diff=lfs merge=lfs -text

.gitignore DELETED Viewed

@@ -1,187 +0,0 @@
-### Python ###
-# Byte-compiled / optimized / DLL files
-__pycache__/
-*.py[cod]
-*$py.class
-# C extensions
-*.so
-# Distribution / packaging
-.Python
-build/
-develop-eggs/
-dist/
-downloads/
-eggs/
-.eggs/
-lib/
-lib64/
-parts/
-sdist/
-var/
-wheels/
-share/python-wheels/
-*.egg-info/
-.installed.cfg
-*.egg
-MANIFEST
-# PyInstaller
-#  Usually these files are written by a python script from a template
-#  before PyInstaller builds the exe, so as to inject date/other infos into it.
-*.manifest
-*.spec
-# Installer logs
-pip-log.txt
-pip-delete-this-directory.txt
-# Unit test / coverage reports
-htmlcov/
-.tox/
-.nox/
-.coverage
-.coverage.*
-.cache
-nosetests.xml
-coverage.xml
-*.cover
-*.py,cover
-.hypothesis/
-.pytest_cache/
-cover/
-# Translations
-*.mo
-*.pot
-# Django stuff:
-*.log
-local_settings.py
-db.sqlite3
-db.sqlite3-journal
-# Flask stuff:
-instance/
-.webassets-cache
-# Scrapy stuff:
-.scrapy
-# Sphinx documentation
-docs/_build/
-# PyBuilder
-.pybuilder/
-target/
-# Jupyter Notebook
-.ipynb_checkpoints
-# IPython
-profile_default/
-ipython_config.py
-# pyenv
-#   For a library or package, you might want to ignore these files since the code is
-#   intended to run in multiple environments; otherwise, check them in:
-# .python-version
-# pipenv
-#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
-#   However, in case of collaboration, if having platform-specific dependencies or dependencies
-#   having no cross-platform support, pipenv may install dependencies that don't work, or not
-#   install all needed dependencies.
-#Pipfile.lock
-# poetry
-#   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
-#   This is especially recommended for binary packages to ensure reproducibility, and is more
-#   commonly ignored for libraries.
-#   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
-#poetry.lock
-# pdm
-#   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
-#pdm.lock
-#   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
-#   in version control.
-#   https://pdm.fming.dev/latest/usage/project/#working-with-version-control
-.pdm.toml
-.pdm-python
-.pdm-build/
-# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
-__pypackages__/
-# Celery stuff
-celerybeat-schedule
-celerybeat.pid
-# SageMath parsed files
-*.sage.py
-# Environments
-.env
-.venv
-env/
-venv/
-ENV/
-env.bak/
-venv.bak/
-yes
-*.pub
-# Spyder project settings
-.spyderproject
-.spyproject
-# Rope project settings
-.ropeproject
-# mkdocs documentation
-/site
-# mypy
-.mypy_cache/
-.dmypy.json
-dmypy.json
-# Pyre type checker
-.pyre/
-# pytype static type analyzer
-.pytype/
-# Cython debug symbols
-cython_debug/
-# PyCharm
-#  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
-#  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
-#  and can be added to the global gitignore or merged into this file.  For a more nuclear
-#  option (not recommended) you can uncomment the following to ignore the entire idea folder.
-#.idea/
-### Python Patch ###
-# Poetry local configuration file - https://python-poetry.org/docs/configuration/#local-configuration
-poetry.toml
-# ruff
-.ruff_cache/
-# LSP config files
-pyrightconfig.json
-# data
-data/
-study_export_*
-study_files.db
-# study_files.json
-infra/ecs_config.toml
-aws-cli.pdf

.gradio/certificate.pem DELETED Viewed

@@ -1,31 +0,0 @@
------BEGIN CERTIFICATE-----
-MIIFazCCA1OgAwIBAgIRAIIQz7DSQONZRGPgu2OCiwAwDQYJKoZIhvcNAQELBQAw
-TzELMAkGA1UEBhMCVVMxKTAnBgNVBAoTIEludGVybmV0IFNlY3VyaXR5IFJlc2Vh
-cmNoIEdyb3VwMRUwEwYDVQQDEwxJU1JHIFJvb3QgWDEwHhcNMTUwNjA0MTEwNDM4
-WhcNMzUwNjA0MTEwNDM4WjBPMQswCQYDVQQGEwJVUzEpMCcGA1UEChMgSW50ZXJu
-ZXQgU2VjdXJpdHkgUmVzZWFyY2ggR3JvdXAxFTATBgNVBAMTDElTUkcgUm9vdCBY
-MTCCAiIwDQYJKoZIhvcNAQEBBQADggIPADCCAgoCggIBAK3oJHP0FDfzm54rVygc
-h77ct984kIxuPOZXoHj3dcKi/vVqbvYATyjb3miGbESTtrFj/RQSa78f0uoxmyF+
-0TM8ukj13Xnfs7j/EvEhmkvBioZxaUpmZmyPfjxwv60pIgbz5MDmgK7iS4+3mX6U
-A5/TR5d8mUgjU+g4rk8Kb4Mu0UlXjIB0ttov0DiNewNwIRt18jA8+o+u3dpjq+sW
-T8KOEUt+zwvo/7V3LvSye0rgTBIlDHCNAymg4VMk7BPZ7hm/ELNKjD+Jo2FR3qyH
-B5T0Y3HsLuJvW5iB4YlcNHlsdu87kGJ55tukmi8mxdAQ4Q7e2RCOFvu396j3x+UC
-B5iPNgiV5+I3lg02dZ77DnKxHZu8A/lJBdiB3QW0KtZB6awBdpUKD9jf1b0SHzUv
-KBds0pjBqAlkd25HN7rOrFleaJ1/ctaJxQZBKT5ZPt0m9STJEadao0xAH0ahmbWn
-OlFuhjuefXKnEgV4We0+UXgVCwOPjdAvBbI+e0ocS3MFEvzG6uBQE3xDk3SzynTn
-jh8BCNAw1FtxNrQHusEwMFxIt4I7mKZ9YIqioymCzLq9gwQbooMDQaHWBfEbwrbw
-qHyGO0aoSCqI3Haadr8faqU9GY/rOPNk3sgrDQoo//fb4hVC1CLQJ13hef4Y53CI
-rU7m2Ys6xt0nUW7/vGT1M0NPAgMBAAGjQjBAMA4GA1UdDwEB/wQEAwIBBjAPBgNV
-HRMBAf8EBTADAQH/MB0GA1UdDgQWBBR5tFnme7bl5AFzgAiIyBpY9umbbjANBgkq
-hkiG9w0BAQsFAAOCAgEAVR9YqbyyqFDQDLHYGmkgJykIrGF1XIpu+ILlaS/V9lZL
-ubhzEFnTIZd+50xx+7LSYK05qAvqFyFWhfFQDlnrzuBZ6brJFe+GnY+EgPbk6ZGQ
-3BebYhtF8GaV0nxvwuo77x/Py9auJ/GpsMiu/X1+mvoiBOv/2X/qkSsisRcOj/KK
-NFtY2PwByVS5uCbMiogziUwthDyC3+6WVwW6LLv3xLfHTjuCvjHIInNzktHCgKQ5
-ORAzI4JMPJ+GslWYHb4phowim57iaztXOoJwTdwJx4nLCgdNbOhdjsnvzqvHu7Ur
-TkXWStAmzOVyyghqpZXjFaH3pO3JLF+l+/+sKAIuvtd7u+Nxe5AW0wdeRlN8NwdC
-jNPElpzVmbUq4JUagEiuTDkHzsxHpFKVK7q4+63SM1N95R1NbdWhscdCb+ZAJzVc
-oyi3B43njTOQ5yOf+1CceWxG1bQVs5ZufpsMljq4Ui0/1lvh+wjChP4kqKOJ2qxq
-4RgqsahDYVvTH9w7jXbyLeiNdd8XM2w9U/t7y0Ff/9yi0GE44Za4rF2LN9d11TPA
-mRGunUHBcnWEvgJBQl9nJEiU0Zsnvgc/ubhPgXRR4Xq37Z0j4r7g1SgEEzwxA57d
-emyPxgcYxn/eR44/KJ4EBs+lVDR3veyJm+kXQ99b21/+jh5Xos1AnX5iItreGCc=
------END CERTIFICATE-----

.isort.cfg DELETED Viewed

@@ -1,7 +0,0 @@
-[settings]
-multi_line_output=3
-include_trailing_comma=True
-force_grid_wrap=0
-use_parentheses=True
-line_length=88
-skip=env,migrations,alembic,venv

Dockerfile.api DELETED Viewed

@@ -1,19 +0,0 @@
-# FastAPI Dockerfile
-FROM python:3.11.10-slim
-ENV PYTHONUNBUFFERED=1
-ENV OMP_NUM_THREADS=1
-# Set working directory
-WORKDIR /app
-# Copy app files
-COPY requirements.txt ./
-RUN pip install --no-cache-dir -r requirements.txt
-COPY . .
-# Expose port
-EXPOSE 8000
-# Command to run the FastAPI app
-CMD ["uvicorn", "api:app", "--host", "0.0.0.0", "--port", "8000"]

Dockerfile.api.prod DELETED Viewed

@@ -1,72 +0,0 @@
-###########
-# BUILDER #
-###########
-ARG AWS_ACCOUNT_ID
-# pull official base image
-FROM ${AWS_ACCOUNT_ID}.dkr.ecr.us-east-1.amazonaws.com/gradio-python:3.11.10-slim as builder
-# set work directory
-WORKDIR /app
-# set environment variables
-ENV PYTHONDONTWRITEBYTECODE 1
-ENV PYTHONUNBUFFERED 1
-ENV OMP_NUM_THREADS=1
-# install dependencies
-RUN apt-get update \
-    && apt-get -y install libpq-dev gcc \
-    && pip install psycopg
-RUN pip install --upgrade pip
-COPY ./requirements.txt /app/requirements.txt
-RUN pip wheel --no-cache-dir --no-deps --wheel-dir /app/wheels -r requirements.txt
-#########
-# FINAL #
-#########
-ARG AWS_ACCOUNT_ID
-# pull official base image
-FROM ${AWS_ACCOUNT_ID}.dkr.ecr.us-east-1.amazonaws.com/gradio-python:3.11.10-slim
-# create directory for the app user
-RUN mkdir -p /home/backend-app
-# create the app user
-RUN addgroup --system app && adduser --system --group app
-# create the appropriate directories
-ENV HOME=/home/app
-ENV BACKEND_APP_HOME=/home/app
-# RUN mkdir $BACKEND_APP_HOME
-WORKDIR $BACKEND_APP_HOME
-# install dependencies
-RUN apt-get update \
-    && apt-get -y install libpq-dev gcc \
-    && pip install psycopg
-COPY --from=builder /app/wheels /wheels
-COPY --from=builder /app/requirements.txt .
-RUN pip install --upgrade pip
-RUN pip install --no-cache /wheels/*
-# copy project
-COPY . $BACKEND_APP_HOME
-# chown all the files to the app user
-RUN chown -R app:app $BACKEND_APP_HOME
-# change to the app user
-USER app
-## Expose port
-EXPOSE 8000
-# Command to run the FastAPI app
-CMD ["uvicorn", "api:app", "--host", "0.0.0.0", "--port", "8000"]

Dockerfile.gradio DELETED Viewed

@@ -1,21 +0,0 @@
-# Gradio Dockerfile
-FROM python:3.11.10-slim
-ENV PYTHONUNBUFFERED=1
-ENV OMP_NUM_THREADS=1
-# Set working directory
-WORKDIR /app
-# Copy app files
-COPY requirements.txt ./
-RUN pip install --no-cache-dir -r requirements.txt
-COPY . .
-# Expose port
-EXPOSE 7860
-ENV GRADIO_SERVER_NAME="0.0.0.0"
-# Command to run the Gradio app
-CMD ["gradio", "app.py"]
-# CMD ["python", "app.py"]

Dockerfile.gradio.prod DELETED Viewed

@@ -1,72 +0,0 @@
-###########
-# BUILDER #
-###########
-ARG AWS_ACCOUNT_ID
-# pull official base image
-FROM ${AWS_ACCOUNT_ID}.dkr.ecr.us-east-1.amazonaws.com/gradio-python:3.11.10-slim as builder
-# set work directory
-WORKDIR /app
-# set environment variables
-ENV PYTHONDONTWRITEBYTECODE 1
-ENV PYTHONUNBUFFERED 1
-ENV OMP_NUM_THREADS=1
-# install dependencies
-RUN apt-get update \
-    && apt-get -y install libpq-dev gcc \
-    && pip install psycopg
-RUN pip install --upgrade pip
-COPY ./requirements.txt /app/requirements.txt
-RUN pip wheel --no-cache-dir --no-deps --wheel-dir /app/wheels -r requirements.txt
-#########
-# FINAL #
-#########
-ARG AWS_ACCOUNT_ID
-# pull official base image
-FROM ${AWS_ACCOUNT_ID}.dkr.ecr.us-east-1.amazonaws.com/gradio-python:3.11.10-slim
-# create directory for the app user
-RUN mkdir -p /home/backend-app
-# create the app user
-RUN addgroup --system app && adduser --system --group app
-# create the appropriate directories
-ENV HOME=/home/app
-ENV BACKEND_APP_HOME=/home/app
-# RUN mkdir $BACKEND_APP_HOME
-WORKDIR $BACKEND_APP_HOME
-# install dependencies
-RUN apt-get update \
-    && apt-get -y install libpq-dev gcc \
-    && pip install psycopg
-COPY --from=builder /app/wheels /wheels
-COPY --from=builder /app/requirements.txt .
-RUN pip install --upgrade pip
-RUN pip install --no-cache /wheels/*
-# copy project
-COPY . $BACKEND_APP_HOME
-# chown all the files to the app user
-RUN chown -R app:app $BACKEND_APP_HOME
-# change to the app user
-USER app
-# Expose port
-EXPOSE 7860
-ENV GRADIO_SERVER_NAME="0.0.0.0"
-CMD ["gradio", "app.py"]

Makefile DELETED Viewed

@@ -1,12 +0,0 @@
-.PHONY: lint-apply lint-check
-lint-check:
-	@echo "Checking for lint errors..."
-	flake8 .
-	black --check .
-	isort --check-only .
-lint-apply:
-	@echo "apply linting ..."
-	black .
-	isort .

README.md CHANGED Viewed

@@ -1,241 +1,13 @@
 ---
-title: 'ACRES: Center For Rapid Evidence Synthesis'
 emoji: 👁
 colorFrom: gray
 colorTo: pink
 sdk: gradio
-sdk_version: 5.6.0
 app_file: app.py
 pinned: false
 license: apache-2.0
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
-# ACRES RAG Project
-## Project Setup
-To test and run the project locally. Clone the project from github and change directoory to `acres`.
-```sh
-git clone https://github.com/SunbirdAI/acres.git
-cd acres
-```
-Create python virtual environment and activate it.
-```sh
-python -m venv env
-source env/bin/activate
-```
-Install project dependencies
-```sh
-pip install -r requirements.txt
-```
-## Run project locally
-To test the project locally follow the steps below.
-Copy `.env.example` to `.env` and provide the correct enviroment variable values.
-```sh
-cp .env.example .env
-```
-Run the application
-```sh
-python app.py
-```
-OR
-```sh
-gradio app.py
-```
-Browse the application with the link `http://localhost:7860/`
-### Run the api
-Make sure the gradio app is running on port `7860` and then run the command below in another terminal tab in the same directory.
-```sh
-uvicorn api:app --reload
-```
-Browse the api at `http://localhost:8000/docs`
-## Run with docker
-To run the application with docker locally, first make sure you have docker installed. See [link](https://docs.docker.com/)
-Build the project docker image
-```sh
-docker build -f Dockerfile.gradio -t gradio-app .
-```
-Create docker network
-```sh
-docker network create gradio-fastapi-network
-```
-Run the docker container
-```sh
-docker run -it -p 7860:7860 --rm --name gradio --network=gradio-fastapi-network gradio-app
-```
-Browse the application with the link `http://localhost:7860/`
-To run the api with docker run the commands below. The gradio container should be run first before running the api.
-```sh
-docker build -f Dockerfile.api -t fastapi-app .
-docker run -it -p 8000:8000 --rm --name fastapi --network=gradio-fastapi-network fastapi-app
-```
-Browse the api at `http://localhost:8000/docs`
-## Deploy to AWS ECS (Elastic Container Service) with Fargate
-Install and configure the AWS CLI and aws credentials. See [link](https://docs.aws.amazon.com/cli/latest/userguide/cli-chap-welcome.html)
-OR: See the pdf document [here](https://docs.aws.amazon.com/pdfs/cli/latest/userguide/aws-cli.pdf#getting-started-quickstart)
-Now follow the steps below to deploy to AWS ECS
-Setup the default region and your aws account id
-```sh
-export AWS_DEFAULT_REGION=region # i.e us-east-1, eu-west-1
-export AWS_ACCOUNT_ID=aws_account_id # ie. 2243838xxxxxx
-```
-Login into the AWS ECR (Elastic Container Registry) via the commandline
-```sh
-aws ecr get-login-password --region $AWS_DEFAULT_REGION | docker login --username AWS --password-stdin "$AWS_ACCOUNT_ID.dkr.ecr.$AWS_DEFAULT_REGION.amazonaws.com"
-```
-Create a python image and push to ECR. This image will be used as the base image for the application image deployed on AWS ECS.
-- Create python repository
-```sh
-aws ecr create-repository \
-  --repository-name gradio-python \
-  --image-tag-mutability MUTABLE
-```
-```sh
-export ECR_PYTHON_URL="$AWS_ACCOUNT_ID.dkr.ecr.$AWS_DEFAULT_REGION.amazonaws.com/gradio-python"
-echo $ECR_PYTHON_URL
-```
-- Pull python image and tag it to the ECR url
-```sh
-docker pull python:3.11.10-slim
-docker tag python:3.11.10-slim $ECR_PYTHON_URL:3.11.10-slim
-docker push $ECR_PYTHON_URL:3.11.10-slim
-```
-- Now create application repostory
-```sh
-aws ecr create-repository \
-  --repository-name gradio-app-prod \
-  --image-tag-mutability MUTABLE
-export ECR_BACKEND_GRADIO_URL="$AWS_ACCOUNT_ID.dkr.ecr.$AWS_DEFAULT_REGION.amazonaws.com/gradio-app-prod"
-echo $ECR_BACKEND_GRADIO_URL
-```
-- Build the docker image for the production and push to ECR
-```sh
-docker build --build-arg AWS_ACCOUNT_ID=$AWS_ACCOUNT_ID -f Dockerfile.gradio.prod -t gradio-app-prod .
-docker tag gradio-app-prod:latest "${ECR_BACKEND_GRADIO_URL}:latest"
-docker push "${ECR_BACKEND_GRADIO_URL}:latest"
-```
-- Now create fastapi repostory
-```sh
-aws ecr create-repository \
-  --repository-name fastapi-api-prod \
-  --image-tag-mutability MUTABLE
-export ECR_BACKEND_FASTAPI_URL="$AWS_ACCOUNT_ID.dkr.ecr.$AWS_DEFAULT_REGION.amazonaws.com/fastapi-api-prod"
-echo $ECR_BACKEND_FASTAPI_URL
-```
-- Build the docker image for the production and push to ECR
-```sh
-docker build --build-arg AWS_ACCOUNT_ID=$AWS_ACCOUNT_ID -f Dockerfile.api.prod -t fastapi-api-prod .
-docker tag fastapi-api-prod:latest "${ECR_BACKEND_FASTAPI_URL}:latest"
-docker push "${ECR_BACKEND_FASTAPI_URL}:latest"
-```
-### Setup and Provision AWS ECS infra using AWS Cloudformation (IaC)
-#### Install
-To install the CFN-CLI run the command below
-```sh
-pip install cloudformation-cli cloudformation-cli-java-plugin cloudformation-cli-go-plugin cloudformation-cli-python-plugin cloudformation-cli-typescript-plugin
-```
-#### CFN-Toml
-```sh
-gem install cfn-toml
-```
-Copy `infra/ecs_config.template` to `infra/ecs_config.toml` and provide the correct `AWS Account ID` for the `ContainerImageGradio`
-```sh
-cp infra/ecs_config.template infra/ecs_config.toml
-```
-#### Deploy
-To deploy the ECS infra run the commands below. It provisions the cloudformation stack changeset for review.
-Log into your aws console and search for `cloudformation`. See and review the changeset. If everything is good execute the changeset to finish with the infra deployment.
-Then look for the outputs to the link for the deployed application.
-```sh
-chmod u+x bin/cfn/*
-./bin/cfn/ecs-deploy
-```
-#### Update Task Definition Deployments
-After making changes, build the docker images and then push to ECR.
-To update the task definition deployments, force the new deployment by running the commands below
-For the gradio task definition
-```sh
-./bin/cfn/ecs-deploy-update-gradio
-```
-For the api task definition
-```sh
-./bin/cfn/ecs-deploy-update-api
-```

 ---
+title: Acres
 emoji: 👁
 colorFrom: gray
 colorTo: pink
 sdk: gradio
+sdk_version: 4.42.0
 app_file: app.py
 pinned: false
 license: apache-2.0
 ---
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

__pycache__/config.cpython-311.pyc ADDED Viewed

Binary file (455 Bytes). View file

api.py DELETED Viewed

@@ -1,134 +0,0 @@
-import logging
-import os
-from enum import Enum
-from typing import List, Optional, Union
-from dotenv import load_dotenv
-from fastapi import FastAPI, HTTPException
-from fastapi.middleware.cors import CORSMiddleware
-from fastapi.responses import FileResponse
-from gradio_client import Client
-from pydantic import BaseModel, ConfigDict, Field, constr
-from docs import description, tags_metadata
-load_dotenv()
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-GRADIO_URL = os.getenv("GRADIO_URL", "http://localhost:7860/")
-logger.info(f"GRADIO_URL: {GRADIO_URL}")
-client = Client(GRADIO_URL)
-app = FastAPI(
-    title="ACRES RAG API",
-    description=description,
-    openapi_tags=tags_metadata,
-)
-origins = ["*"]
-app.add_middleware(
-    CORSMiddleware,
-    allow_origins=origins,
-    allow_credentials=True,
-    allow_methods=["*"],
-    allow_headers=["*"],
-)
-class StudyVariables(str, Enum):
-    ebola_virus = "Ebola Virus"
-    vaccine_coverage = "Vaccine coverage"
-    genexpert = "GeneXpert"
-class PromptType(str, Enum):
-    default = "Default"
-    highlight = "Highlight"
-    evidence_based = "Evidence-based"
-class StudyVariableRequest(BaseModel):
-    study_variable: Union[StudyVariables, str]
-    prompt_type: PromptType
-    text: constr(min_length=1, strip_whitespace=True)  # type: ignore
-    model_config = ConfigDict(from_attributes=True)
-class DownloadCSV(BaseModel):
-    text: constr(min_length=1, strip_whitespace=True)  # type: ignore
-    model_config = ConfigDict(from_attributes=True)
-class Study(BaseModel):
-    study_name: constr(min_length=1, strip_whitespace=True)  # type: ignore
-    model_config = ConfigDict(from_attributes=True)
-class ZoteroCredentials(BaseModel):
-    library_id: constr(min_length=1, strip_whitespace=True)  # type: ignore
-    api_access_key: constr(min_length=1, strip_whitespace=True)  # type: ignore
-    model_config = ConfigDict(from_attributes=True)
-@app.post("/process_zotero_library_items", tags=["zotero"])
-def process_zotero_library_items(zotero_credentials: ZoteroCredentials):
-    result = client.predict(
-        zotero_library_id_param=zotero_credentials.library_id,
-        zotero_api_access_key=zotero_credentials.api_access_key,
-        api_name="/process_zotero_library_items",
-    )
-    return {"result": result}
-@app.post("/get_study_info", tags=["zotero"])
-def get_study_info(study: Study):
-    result = client.predict(study_name=study.study_name, api_name="/get_study_info")
-    # print(result)
-    return {"result": result}
-@app.post("/study_variables", tags=["zotero"])
-def process_study_variables(
-    study_request: StudyVariableRequest,
-):
-    result = client.predict(
-        text=study_request.text,  # "study id, study title, study design, study summary",
-        study_name=study_request.study_variable,  # "Ebola Virus",
-        prompt_type=study_request.prompt_type,  # "Default",
-        api_name="/process_multi_input",
-    )
-    print(type(result))
-    return {"result": result[0]}
-@app.post("/new_study_choices", tags=["zotero"])
-def new_study_choices():
-    result = client.predict(api_name="/new_study_choices")
-    return {"result": result}
-@app.post("/download_csv", tags=["zotero"])
-def download_csv(download_request: DownloadCSV):
-    result = client.predict(
-        markdown_content=download_request.text, api_name="/download_as_csv"
-    )
-    print(result)
-    file_path = result
-    if not file_path or not os.path.exists(file_path):
-        raise HTTPException(status_code=404, detail="File not found")
-    # Use FileResponse to send the file to the client
-    return FileResponse(
-        file_path,
-        media_type="text/csv",  # Specify the correct MIME type for CSV
-        filename=os.path.basename(
-            file_path
-        ),  # Provide a default filename for the download
-    )

app.py CHANGED Viewed

@@ -1,687 +1,102 @@
-# app.py
-import csv
-import datetime
-# from datetime import datetime
-import io
-import json
-import logging
-import os
-from typing import Any, List, Tuple, Union
 import gradio as gr
-import openai
-from cachetools import LRUCache
-from dotenv import load_dotenv
-from slugify import slugify
-from config import OPENAI_API_KEY, STUDY_FILES
-from interface import create_chat_interface
 from rag.rag_pipeline import RAGPipeline
-from utils.db import (
-    add_study_files_to_db,
-    create_db_and_tables,
-    get_all_study_files,
-    get_study_file_by_name,
-    get_study_files_by_library_id,
-)
-from utils.helpers import (
-    add_study_files_to_chromadb,
-    append_to_study_files,
-    chromadb_client,
-    create_directory,
 )
-from utils.pdf_processor import PDFProcessor
-from utils.prompts import evidence_based_prompt, highlight_prompt
-from utils.zotero_manager import ZoteroManager
-data_directory = "data"
-create_directory(data_directory)
-# Configure logging
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-load_dotenv()
-openai.api_key = OPENAI_API_KEY
-# Initialize ChromaDB with study files
-add_study_files_to_chromadb("study_files.json", "study_files_collection")
-# Create sqlite study file data table
-create_db_and_tables()
 # Cache for RAG pipelines
 rag_cache = {}
-cache = LRUCache(maxsize=100)
-def get_cache_value(key):
-    return cache.get(key)
-zotero_library_id = get_cache_value("zotero_library_id")
-logger.info(f"zotero_library_id cache: {zotero_library_id}")
-def get_rag_pipeline(study_name: str) -> RAGPipeline:
-    """Get or create a RAGPipeline instance for the given study by querying ChromaDB."""
     if study_name not in rag_cache:
-        study = get_study_file_by_name(study_name)
-        if not study:
             raise ValueError(f"Invalid study name: {study_name}")
-        study_file = study.file_path
-        logger.info(f"study_file: {study_file}")
-        if not study_file:
-            raise ValueError(f"File path not found for study name: {study_name}")
-        rag_cache[study_name] = RAGPipeline(study_file)
     return rag_cache[study_name]
-def get_study_info(study_name: Union[str, list]) -> str:
-    """Retrieve information about the specified study."""
-    if isinstance(study_name, list):
-        study_name = study_name[0] if study_name else None
-    if not study_name:
-        return "No study selected"
-    study = get_study_file_by_name(study_name)
-    logger.info(f"Study: {study}")
-    if not study:
-        raise ValueError(f"Invalid study name: {study_name}")
-    study_file = study.file_path
-    logger.info(f"study_file: {study_file}")
-    if not study_file:
-        raise ValueError(f"File path not found for study name: {study_name}")
-    with open(study_file, "r") as f:
-        data = json.load(f)
-    return f"### Number of documents: {len(data)}"
-def markdown_table_to_csv(markdown_text: str) -> str:
-    """Convert a markdown table to CSV format."""
-    lines = [line.strip() for line in markdown_text.split("\n") if line.strip()]
-    table_lines = [line for line in lines if line.startswith("|")]
-    if not table_lines:
-        return ""
-    csv_data = []
-    for line in table_lines:
-        if "---" in line:
-            continue
-        # Split by |, remove empty strings, and strip whitespace
-        cells = [cell.strip() for cell in line.split("|") if cell.strip()]
-        csv_data.append(cells)
-    output = io.StringIO()
-    writer = csv.writer(output)
-    writer.writerows(csv_data)
-    return output.getvalue()
-def cleanup_temp_files():
-    """Clean up old temporary files."""
-    try:
-        current_time = datetime.datetime.now()
-        for file in os.listdir():
-            if file.startswith("study_export_") and file.endswith(".csv"):
-                file_time = datetime.datetime.fromtimestamp(os.path.getmtime(file))
-                # Calculate the time difference in seconds
-                time_difference = (current_time - file_time).total_seconds()
-                if time_difference > 20:  # 5 minutes in seconds
-                    try:
-                        os.remove(file)
-                    except Exception as e:
-                        logger.warning(f"Failed to remove temp file {file}: {e}")
-    except Exception as e:
-        logger.warning(f"Error during cleanup: {e}")
-def chat_function(message: str, study_name: str, prompt_type: str) -> str:
-    """Process a chat message and generate a response using the RAG pipeline."""
-    if not message.strip():
-        return "Please enter a valid query."
-    rag = get_rag_pipeline(study_name)
-    logger.info(f"rag: {rag}")
-    prompt = {
-        "Highlight": highlight_prompt,
-        "Evidence-based": evidence_based_prompt,
-    }.get(prompt_type)
-    response, _ = rag.query(message, prompt_template=prompt)  # Unpack the tuple
-    return response
-def process_zotero_library_items(
-    zotero_library_id_param: str, zotero_api_access_key: str
-) -> str:
-    global zotero_library_id
-    if not zotero_library_id_param or not zotero_api_access_key:
-        return "Please enter your zotero library Id and API Access Key"
-    zotero_library_id = zotero_library_id_param
-    cache["zotero_library_id"] = zotero_library_id
-    zotero_library_type = "user"  # or "group"
-    zotero_api_access_key = zotero_api_access_key
-    message = ""
-    try:
-        zotero_manager = ZoteroManager(
-            zotero_library_id, zotero_library_type, zotero_api_access_key
-        )
-        zotero_collections = zotero_manager.get_collections()
-        zotero_collection_lists = zotero_manager.list_zotero_collections(
-            zotero_collections
-        )
-        filtered_zotero_collection_lists = (
-            zotero_manager.filter_and_return_collections_with_items(
-                zotero_collection_lists
-            )
-        )
-        study_files_data = {}  # Dictionary to collect items for ChromaDB
-        for collection in filtered_zotero_collection_lists:
-            collection_name = collection.get("name")
-            if collection_name not in STUDY_FILES:
-                collection_key = collection.get("key")
-                collection_items = zotero_manager.get_collection_items(collection_key)
-                zotero_collection_items = (
-                    zotero_manager.get_collection_zotero_items_by_key(collection_key)
-                )
-                # Export zotero collection items to json
-                zotero_items_json = zotero_manager.zotero_items_to_json(
-                    zotero_collection_items
-                )
-                export_file = f"{slugify(collection_name)}_zotero_items.json"
-                zotero_manager.write_zotero_items_to_json_file(
-                    zotero_items_json, f"data/{export_file}"
-                )
-                append_to_study_files(
-                    "study_files.json", collection_name, f"data/{export_file}"
-                )
-                # Collect for ChromaDB
-                study_files_data[collection_name] = f"data/{export_file}"
-                # Update in-memory STUDY_FILES for reference in current session
-                STUDY_FILES.update({collection_name: f"data/{export_file}"})
-                logger.info(f"STUDY_FILES: {STUDY_FILES}")
-        # After loop, add all collected data to ChromaDB
-        add_study_files_to_chromadb("study_files.json", "study_files_collection")
-        # Add collected data to sqlite
-        add_study_files_to_db("study_files.json", zotero_library_id)
-        # Dynamically update study choices
-        global study_choices
-        study_choices = [
-            file.name for file in get_study_files_by_library_id([zotero_library_id])
-        ]
-        message = "Successfully processed items in your zotero library"
-    except Exception as e:
-        message = f"Error process your zotero library: {str(e)}"
-    return message
-process_zotero_library_items(
-    os.getenv("ZOTERO_LIBRARY_ID"), os.getenv("ZOTERO_API_ACCESS_KEY")
-)
-def refresh_study_choices():
-    """
-    Refresh study choices for a specific dropdown instance.
-    :return: Updated Dropdown with current study choices
-    """
-    global study_choices, zotero_library_id
-    zotero_library_id = get_cache_value("zotero_library_id")
-    logger.info(f"zotero_library_id refreshed: {zotero_library_id}")
-    study_choices = [
-        file.name for file in get_study_files_by_library_id([zotero_library_id])
-    ]
-    logger.info(f"Study choices refreshed: {study_choices}")
-    return study_choices
-def new_study_choices():
-    """
-    Refresh study choices for a specific dropdown instance.
-    """
-    study_choices = refresh_study_choices()
-    study_choices = ", ".join(study_choices)
-    return f"**Your studies are: {study_choices}**"
-def process_multi_input(text, study_name, prompt_type):
-    # Split input based on commas and strip any extra spaces
-    variable_list = [word.strip().upper() for word in text.split(",")]
-    user_message = f"Extract and present in a tabular format the following variables for each {study_name} study: {', '.join(variable_list)}"
-    logger.info(f"User message: {user_message}")
-    response = chat_function(user_message, study_name, prompt_type)
-    return [response, gr.update(visible=True)]
-def download_as_csv(markdown_content):
-    """Convert markdown table to CSV and provide for download."""
-    if not markdown_content:
-        return None
-    csv_content = markdown_table_to_csv(markdown_content)
-    if not csv_content:
-        return None
-    # Create temporary file with actual content
-    timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
-    temp_path = f"study_export_{timestamp}.csv"
-    with open(temp_path, "w", newline="", encoding="utf-8") as f:
-        f.write(csv_content)
-    return temp_path
-# PDF Support
-def process_pdf_uploads(files: List[gr.File], collection_name: str) -> str:
-    """Process uploaded PDF files and add them to the system."""
-    if not files or not collection_name:
-        return "Please upload PDF files and provide a collection name"
-    try:
-        processor = PDFProcessor()
-        # Save uploaded files temporarily
-        file_paths = []
-        for file in files:
-            # Get the actual file path from the Gradio File object
-            if hasattr(file, "name"):  # If it's already a path
-                temp_path = file.name
-            else:  # If it needs to be saved
-                temp_path = os.path.join(processor.upload_dir, file.orig_name)
-                file.save(temp_path)
-            file_paths.append(temp_path)
-        # Process PDFs
-        output_path = processor.process_pdfs(file_paths, collection_name)
-        # Add to study files and ChromaDB
-        collection_id = f"pdf_{slugify(collection_name)}"
-        append_to_study_files("study_files.json", collection_id, output_path)
-        add_study_files_to_chromadb("study_files.json", "study_files_collection")
-        # Cleanup temporary files if they were created by us
-        for path in file_paths:
-            if path.startswith(processor.upload_dir):
-                try:
-                    os.remove(path)
-                except Exception as e:
-                    logger.warning(f"Failed to remove temporary file {path}: {e}")
-        return f"Successfully processed PDFs into collection: {collection_id}"
-    except Exception as e:
-        logger.error(f"Error in process_pdf_uploads: {str(e)}")
-        return f"Error processing PDF files: {str(e)}"
-def chat_response(
-    message: str,
-    history: List[Tuple[str, str]],
-    study_name: str,
-    pdf_processor: PDFProcessor,
-) -> Tuple[List[Tuple[str, str]], str, Any]:
-    """Generate chat response and update history."""
-    if not message.strip():
-        return history, None, None
     rag = get_rag_pipeline(study_name)
-    response, source_info = rag.query(message)
-    history.append((message, response))
-    # Generate PDF preview if source information is available
-    # preview_image = None
-    if (
-        source_info
-        and source_info.get("source_file")
-        and source_info.get("page_numbers")
-    ):
-        try:
-            # Get the first page number from the source
-            page_num = source_info["page_numbers"][0]
-        except Exception as e:
-            logger.error(f"Error generating PDF preview: {str(e)}")
-    return history
-def create_gr_interface() -> gr.Blocks:
-    """Create and configure the Gradio interface for the RAG platform."""
-    global zotero_library_id
-    with gr.Blocks(theme=gr.themes.Base()) as demo:
-        gr.Markdown("# ACRES RAG Platform")
-        with gr.Tabs() as tabs:
-            # Tab 1: Original Study Analysis Interface
-            with gr.Tab("Study Analysis"):
-                with gr.Row():
-                    with gr.Column(scale=1):
-                        gr.Markdown("### Zotero Credentials")
-                        zotero_library_id_param = gr.Textbox(
-                            label="Zotero Library ID",
-                            type="password",
-                            placeholder="Enter Your Zotero Library ID here...",
-                        )
-                        zotero_api_access_key = gr.Textbox(
-                            label="Zotero API Access Key",
-                            type="password",
-                            placeholder="Enter Your Zotero API Access Key...",
-                        )
-                        process_zotero_btn = gr.Button("Process your Zotero Library")
-                        zotero_output = gr.Markdown(label="Zotero")
-                        local_storage_state = gr.BrowserState(
-                            {"zotero_library_id": "", "study_choices": []}
-                        )
-                        gr.Markdown("### Study Information")
-                        zotero_library_id = zotero_library_id_param.value
-                        if zotero_library_id is None:
-                            zotero_library_id = get_cache_value("zotero_library_id")
-                        logger.info(f"zotero_library_id: =====> {zotero_library_id}")
-                        study_choices = refresh_study_choices()
-                        logger.info(f"study_choices_db: =====> {study_choices}")
-                        study_dropdown = gr.Dropdown(
-                            choices=study_choices,
-                            label="Select Study",
-                            value=(study_choices[0] if study_choices else None),
-                            allow_custom_value=True,
-                        )
-                        # In Gradio interface setup
-                        refresh_button = gr.Button("Refresh Studies")
-                        study_info = gr.Markdown(label="Study Details")
-                        new_studies = gr.Markdown(label="Your Studies")
-                        prompt_type = gr.Radio(
-                            ["Default", "Highlight", "Evidence-based"],
-                            label="Prompt Type",
-                            value="Default",
-                        )
-                        @demo.load(
-                            inputs=[local_storage_state],
-                            outputs=[zotero_library_id_param],
-                        )
-                        def load_from_local_storage(saved_values):
-                            print("loading from local storage", saved_values)
-                            return saved_values.get("zotero_library_id")
-                        @gr.on(
-                            [
-                                zotero_library_id_param.change,
-                                process_zotero_btn.click,
-                                refresh_button.click,
-                            ],
-                            inputs=[zotero_library_id_param],
-                            outputs=[local_storage_state],
-                        )
-                        def save_to_local_storage(zotero_library_id_param):
-                            study_choices = refresh_study_choices()
-                            return {
-                                "zotero_library_id": zotero_library_id_param,
-                                "study_choices": study_choices,
-                            }
-                    with gr.Column(scale=3):
-                        gr.Markdown("### Study Variables")
-                        with gr.Row():
-                            study_variables = gr.Textbox(
-                                show_label=False,
-                                placeholder="Type your variables separated by commas e.g (Study ID, Study Title, Authors etc)",
-                                scale=4,
-                                lines=1,
-                                autofocus=True,
-                            )
-                            submit_btn = gr.Button("Submit", scale=1)
-                        answer_output = gr.Markdown(label="Answer")
-                        download_btn = gr.DownloadButton(
-                            "Download as CSV",
-                            variant="primary",
-                            size="sm",
-                            scale=1,
-                            visible=False,
-                        )
-            # Tab 2: PDF Chat Interface
-            with gr.Tab("PDF Chat"):
-                pdf_processor = PDFProcessor()
-                with gr.Row():
-                    # Left column: Chat and Input
-                    with gr.Column(scale=7):
-                        chat_history = gr.Chatbot(
-                            value=[], height=600, show_label=False
-                        )
-                        with gr.Row():
-                            query_input = gr.Textbox(
-                                show_label=False,
-                                placeholder="Ask a question about your PDFs...",
-                                scale=8,
-                            )
-                            chat_submit_btn = gr.Button(
-                                "Send", scale=2, variant="primary"
-                            )
-                    # Right column: PDF Preview and Upload
-                    with gr.Column(scale=3):
-                        # pdf_preview = gr.Image(label="Source Page", height=600)
-                        source_info = gr.Markdown(
-                            label="Sources",
-                            value="No sources available yet."
-                        )
-                        with gr.Row():
-                            pdf_files = gr.File(
-                                file_count="multiple",
-                                file_types=[".pdf"],
-                                label="Upload PDFs",
-                            )
-                        with gr.Row():
-                            collection_name = gr.Textbox(
-                                label="Collection Name",
-                                placeholder="Name this PDF collection...",
-                            )
-                        with gr.Row():
-                            upload_btn = gr.Button("Process PDFs", variant="primary")
-                        pdf_status = gr.Markdown()
-                        current_collection = gr.State(value=None)
-        # Event handlers for Study Analysis tab
-        process_zotero_btn.click(
-            process_zotero_library_items,
-            inputs=[zotero_library_id_param, zotero_api_access_key],
-            outputs=[zotero_output],
         )
-        study_dropdown.change(
-            get_study_info, inputs=[study_dropdown], outputs=[study_info]
-        )
-        submit_btn.click(
-            process_multi_input,
-            inputs=[study_variables, study_dropdown, prompt_type],
-            outputs=[answer_output, download_btn],
-        )
-        download_btn.click(
-            fn=download_as_csv, inputs=[answer_output], outputs=[download_btn]
-        ).then(fn=cleanup_temp_files, inputs=None, outputs=None)
-        refresh_button.click(
-            fn=new_study_choices,
-            outputs=[new_studies],  # Update the same dropdown
         )
-        # Event handlers for PDF Chat tab
-        def handle_pdf_upload(files, name):
-            if not name:
-                return "Please provide a collection name", None
-            if not files:
-                return "Please select PDF files", None
-            try:
-                processor = PDFProcessor()
-                # Process PDFs
-                output_path = processor.process_pdfs(files, name)
-                collection_id = f"pdf_{slugify(name)}"
-                # Add to study files JSON
-                append_to_study_files("study_files.json", collection_id, output_path)
-                # Add to ChromaDB
-                add_study_files_to_chromadb("study_files.json", "study_files_collection")
-                # Add to SQLite database - this is the crucial missing step
-                add_study_files_to_db("study_files.json", "local")  # Add library_id parameter
-                return f"Successfully processed PDFs into collection: {collection_id}", collection_id
-            except Exception as e:
-                logger.error(f"Error in handle_pdf_upload: {str(e)}")
-                return f"Error: {str(e)}", None
-        def add_message(history, message):
-            """Add user message to chat history."""
-            if not message.strip():
-                raise gr.Error("Please enter a message")
-            history = history + [(message, None)]
-            return history, "", None
-        def format_source_info(source_nodes) -> str:
-            """Format source information into a markdown string."""
-            if not source_nodes:
-                return "No source information available"
-            sources_md = "### Sources\n\n"
-            seen_sources = set()  # To track unique sources
-            for idx, node in enumerate(source_nodes, 1):
-                metadata = node.metadata
-                if not metadata:
-                    continue
-                source_key = (metadata.get('source_file', ''), metadata.get('page_number', 0))
-                if source_key in seen_sources:
-                    continue
-                seen_sources.add(source_key)
-                title = metadata.get('title', os.path.basename(metadata.get('source_file', 'Unknown')))
-                page = metadata.get('page_number', 'N/A')
-                sources_md += f"{idx}. **{title}** - Page {page}\n"
-            return sources_md
-        def generate_chat_response(history, collection_id, pdf_processor):
-            """Generate response for the last message in history."""
-            if not collection_id:
-                raise gr.Error("Please upload PDFs first")
-            if len(history) == 0:
-                return history, None
-            last_message = history[-1][0]
-            try:
-                # Get response and source info
-                rag = get_rag_pipeline(collection_id)
-                response_text, source_nodes = rag.query(last_message)
-                # Format sources info
-                sources_md = "### Top Sources\n\n"
-                if source_nodes and len(source_nodes) > 0:
-                    seen_sources = set()
-                    source_count = 0
-                    # Only process up to 3 sources
-                    for node in source_nodes:
-                        if source_count >= 3:  # Stop after 3 sources
-                            break
-                        if not hasattr(node, 'metadata'):
-                            continue
-                        metadata = node.metadata
-                        source_key = (
-                            metadata.get('source_file', ''),
-                            metadata.get('page_number', 0)
-                        )
-                        if source_key in seen_sources:
-                            continue
-                        seen_sources.add(source_key)
-                        source_count += 1
-                        title = metadata.get('title', 'Unknown')
-                        if not title or title == 'Unknown':
-                            title = os.path.basename(metadata.get('source_file', 'Unknown Document'))
-                        page = metadata.get('page_number', 'N/A')
-                        sources_md += f"{source_count}. **{title}** - Page {page}\n"
-                    if source_count == 0:
-                        sources_md = "No source information available"
-                else:
-                    sources_md = "No source information available"
-                # Update history with response
-                history[-1] = (last_message, response_text)
-                return history, sources_md
-            except Exception as e:
-                logger.error(f"Error in generate_chat_response: {str(e)}")
-                history[-1] = (last_message, f"Error: {str(e)}")
-                return history, "Error retrieving sources"
-        # Update PDF event handlers
-        upload_btn.click(  # Change from pdf_files.upload to upload_btn.click
-            handle_pdf_upload,
-            inputs=[pdf_files, collection_name],
-            outputs=[pdf_status, current_collection],
-        )
-        # Fixed chat event handling
-        chat_submit_btn.click(
-            add_message,
-            inputs=[chat_history, query_input],
-            outputs=[chat_history, query_input],
-        ).success(
-            generate_chat_response,
-            inputs=[chat_history, current_collection],
-            outputs=[chat_history, source_info],
-        )
-    return demo
-demo = create_gr_interface()
 if __name__ == "__main__":
-    # demo = create_gr_interface()
     demo.launch(share=True, debug=True)

 import gradio as gr
+import json
 from rag.rag_pipeline import RAGPipeline
+from utils.prompts import highlight_prompt, evidence_based_prompt
+from utils.prompts import (
+    sample_questions,
 )
+from config import STUDY_FILES
 # Cache for RAG pipelines
 rag_cache = {}
+def get_rag_pipeline(study_name):
     if study_name not in rag_cache:
+        study_file = STUDY_FILES.get(study_name)
+        if study_file:
+            rag_cache[study_name] = RAGPipeline(study_file)
+        else:
             raise ValueError(f"Invalid study name: {study_name}")
     return rag_cache[study_name]
+def query_rag(study_name: str, question: str, prompt_type: str) -> str:
     rag = get_rag_pipeline(study_name)
+    if prompt_type == "Highlight":
+        prompt = highlight_prompt
+    elif prompt_type == "Evidence-based":
+        prompt = evidence_based_prompt
+    else:
+        prompt = None
+    # Use the prepared context in the query
+    response = rag.query(question, prompt_template=prompt)
+    return response.response
+def get_study_info(study_name):
+    study_file = STUDY_FILES.get(study_name)
+    if study_file:
+        with open(study_file, "r") as f:
+            data = json.load(f)
+        return f"**Number of documents:** {len(data)}\n\n**First document title:** {data[0]['title']}"
+    else:
+        return "Invalid study name"
+def update_sample_questions(study_name):
+    return gr.Dropdown(choices=sample_questions.get(study_name, []), interactive=True)
+with gr.Blocks() as demo:
+    gr.Markdown("# RAG Pipeline Demo")
+    with gr.Row():
+        study_dropdown = gr.Dropdown(
+            choices=list(STUDY_FILES.keys()), label="Select Study"
         )
+        study_info = gr.Markdown(label="Study Information")
+    study_dropdown.change(get_study_info, inputs=[study_dropdown], outputs=[study_info])
+    with gr.Row():
+        question_input = gr.Textbox(label="Enter your question")
+        sample_question_dropdown = gr.Dropdown(
+            choices=[], label="Sample Questions", interactive=True
         )
+    study_dropdown.change(
+        update_sample_questions,
+        inputs=[study_dropdown],
+        outputs=[sample_question_dropdown],
+    )
+    sample_question_dropdown.change(
+        lambda x: x, inputs=[sample_question_dropdown], outputs=[question_input]
+    )
+    prompt_type = gr.Radio(
+        [
+            "Default",
+            "Highlight",
+            "Evidence-based",
+        ],
+        label="Prompt Type",
+        value="Default",
+    )
+    submit_button = gr.Button("Submit")
+    answer_output = gr.Markdown(label="Answer")
+    submit_button.click(
+        query_rag,
+        inputs=[study_dropdown, question_input, prompt_type],
+        outputs=[answer_output],
+    )
 if __name__ == "__main__":
     demo.launch(share=True, debug=True)

bin/cfn/ecs-delete DELETED Viewed

@@ -1,14 +0,0 @@
-#! /usr/bin/env bash
-set -e # stop the execution of the script if it fails
-CONFIG_PATH="/Users/patrickcmd/Projects/sunbirdai/Acres/infra/ecs_config.toml"
-REGION=$(cfn-toml key deploy.region -t $CONFIG_PATH)
-STACK_NAME=$(cfn-toml key deploy.stack_name -t $CONFIG_PATH)
-aws cloudformation delete-stack \
-    --stack-name $STACK_NAME \
-    --region $REGION \
-    --profile sunbirdai

bin/cfn/ecs-deploy DELETED Viewed

@@ -1,25 +0,0 @@
-#! /usr/bin/env bash
-set -e # stop the execution of the script if it fails
-CFN_PATH="/Users/patrickcmd/Projects/sunbirdai/Acres/infra/ecs_fargate.yml"
-CONFIG_PATH="/Users/patrickcmd/Projects/sunbirdai/Acres/infra/ecs_config.toml"
-echo $CFN_PATH
-cfn-lint $CFN_PATH
-BUCKET=$(cfn-toml key deploy.bucket -t $CONFIG_PATH)
-REGION=$(cfn-toml key deploy.region -t $CONFIG_PATH)
-STACK_NAME=$(cfn-toml key deploy.stack_name -t $CONFIG_PATH)
-PARAMETERS=$(cfn-toml params v2 -t $CONFIG_PATH)
-aws cloudformation deploy \
-  --stack-name $STACK_NAME \
-  --s3-bucket $BUCKET \
-  --s3-prefix acres-rag \
-  --region $REGION \
-  --template-file "$CFN_PATH" \
-  --no-execute-changeset \
-  --tags group=acres-rag \
-  --parameter-overrides $PARAMETERS \
-  --capabilities CAPABILITY_NAMED_IAM \
-  --profile acres

bin/cfn/ecs-deploy-update-api DELETED Viewed

@@ -1,22 +0,0 @@
-#! /usr/bin/env bash
-set -e
-CLUSTER_NAME="rag-ecs-cluster"
-FASTAPI_SERVICE_NAME="dev-acres-fastapi"
-TASK_FASTAPI_DEFINTION_FAMILY="dev-acres-fastapi"
-LATEST_FASTAPI_TASK_DEFINITION_ARN=$(aws ecs describe-task-definition \
---task-definition $TASK_FASTAPI_DEFINTION_FAMILY \
---query 'taskDefinition.taskDefinitionArn' \
---output text)
-echo "TASK DEF ARN:"
-echo $LATEST_FASTAPI_TASK_DEFINITION_ARN
-aws ecs update-service \
---cluster $CLUSTER_NAME \
---service $FASTAPI_SERVICE_NAME \
---task-definition $LATEST_FASTAPI_TASK_DEFINITION_ARN \
---force-new-deployment

bin/cfn/ecs-deploy-update-gradio DELETED Viewed

@@ -1,22 +0,0 @@
-#! /usr/bin/env bash
-set -e
-CLUSTER_NAME="rag-ecs-cluster"
-SERVICE_NAME="dev-acres-gradio"
-TASK_GRADIO_DEFINTION_FAMILY="dev-acres-gradio"
-LATEST_GRADIO_TASK_DEFINITION_ARN=$(aws ecs describe-task-definition \
---task-definition $TASK_GRADIO_DEFINTION_FAMILY \
---query 'taskDefinition.taskDefinitionArn' \
---output text)
-echo "TASK DEF ARN:"
-echo $LATEST_GRADIO_TASK_DEFINITION_ARN
-aws ecs update-service \
---cluster $CLUSTER_NAME \
---service $SERVICE_NAME \
---task-definition $LATEST_GRADIO_TASK_DEFINITION_ARN \
---force-new-deployment

commands.md DELETED Viewed

@@ -1,53 +0,0 @@
-docker network create gradio-fastapi-network
-docker run -it -p 7860:7860 --rm --name gradio --network=gradio-fastapi-network gradio-app
-docker run -it -p 7860:7860 --rm --name gradio --network=gradio-fastapi-network gradio-app-prod
-export AWS_DEFAULT_REGION=us-east-1
-export AWS_ACCOUNT_ID=2244276xxxxx
-aws ecr get-login-password --region $AWS_DEFAULT_REGION | docker login --username AWS --password-stdin "$AWS_ACCOUNT_ID.dkr.ecr.$AWS_DEFAULT_REGION.amazonaws.com"
-aws ecr create-repository \
-  --repository-name gradio-python \
-  --image-tag-mutability MUTABLE
-export ECR_PYTHON_URL="$AWS_ACCOUNT_ID.dkr.ecr.$AWS_DEFAULT_REGION.amazonaws.com/gradio-python"
-echo $ECR_PYTHON_URL
-docker pull python:3.11.10-slim
-docker tag python:3.11.10-slim $ECR_PYTHON_URL:3.11.10-slim
-docker push $ECR_PYTHON_URL:3.11.10-slim
-aws ecr create-repository \
-  --repository-name gradio-app-prod \
-  --image-tag-mutability MUTABLE
-export ECR_BACKEND_GRADIO_URL="$AWS_ACCOUNT_ID.dkr.ecr.$AWS_DEFAULT_REGION.amazonaws.com/gradio-app-prod"
-echo $ECR_BACKEND_GRADIO_URL
-docker build --build-arg AWS_ACCOUNT_ID=2244276xxxxx -t your-image-name .
-docker build -f Dockerfile.gradio.prod -t gradio-app-prod .
-docker build --build-arg AWS_ACCOUNT_ID=$AWS_ACCOUNT_ID -f Dockerfile.gradio.prod -t gradio-app-prod .
-docker tag gradio-app-prod:latest "${ECR_BACKEND_GRADIO_URL}:latest"
-docker push "${ECR_BACKEND_GRADIO_URL}:latest"
-docker build -f Dockerfile.api -t fastapi-app .
-docker run -it -p 8000:8000 --rm --name fastapi --network=gradio-fastapi-network fastapi-app
-aws ecr create-repository \
-  --repository-name fastapi-api-prod \
-  --image-tag-mutability MUTABLE
-export ECR_BACKEND_FASTAPI_URL="$AWS_ACCOUNT_ID.dkr.ecr.$AWS_DEFAULT_REGION.amazonaws.com/fastapi-api-prod"
-echo $ECR_BACKEND_FASTAPI_URL
-docker build --build-arg AWS_ACCOUNT_ID=$AWS_ACCOUNT_ID -f Dockerfile.api.prod -t fastapi-api-prod .
-docker tag fastapi-api-prod:latest "${ECR_BACKEND_FASTAPI_URL}:latest"
-docker push "${ECR_BACKEND_FASTAPI_URL}:latest"

config.py CHANGED Viewed

@@ -1,14 +1,9 @@
-# config.py
 import os
-from dotenv import load_dotenv
-from utils.helpers import read_study_files
-load_dotenv()
 OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
-STUDY_FILES = read_study_files(("study_files.json"))

 import os
 OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
+STUDY_FILES = {
+    "Vaccine Coverage": "data/vaccine_coverage_zotero_items.json",
+    "Ebola Virus": "data/ebola_virus_zotero_items.json",
+    "Gene Xpert": "data/gene_xpert_zotero_items.json",
+}

config/pdf_config.yaml DELETED Viewed

File without changes

data/.keep DELETED Viewed

File without changes

data/ebola_virus_zotero_items.json CHANGED Viewed

@@ -11,7 +11,7 @@
       "Marco Tuccori"
     ],
     "doi": "",
-    "date": "2020",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -28,7 +28,7 @@
       "Sina Bavari"
     ],
     "doi": "10.1146/annurev-pharmtox-010716-105055",
-    "date": "2017-01-06",
     "item_type": "journalArticle",
     "url": "https://www.annualreviews.org/doi/10.1146/annurev-pharmtox-010716-105055"
   },
@@ -48,7 +48,7 @@
       "Xiangguo Qiu"
     ],
     "doi": "10.1016/j.molmed.2017.07.002",
-    "date": "09/2017",
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S1471491417301090"
   },
@@ -66,7 +66,7 @@
       "Robert L. Gottlieb"
     ],
     "doi": "10.1038/s41577-021-00542-x",
-    "date": "06/2021",
     "item_type": "journalArticle",
     "url": "https://www.nature.com/articles/s41577-021-00542-x"
   },
@@ -85,7 +85,7 @@
       "M. P. Grobusch"
     ],
     "doi": "10.1080/13543784.2016.1240785",
-    "date": "2016-11-01",
     "item_type": "journalArticle",
     "url": "https://www.tandfonline.com/doi/full/10.1080/13543784.2016.1240785"
   },
@@ -99,7 +99,7 @@
       "Luciana Borio"
     ],
     "doi": "10.1128/microbiolspec.EI10-0014-2016",
-    "date": "2016-05-06",
     "item_type": "journalArticle",
     "url": "https://journals.asm.org/doi/10.1128/microbiolspec.EI10-0014-2016"
   },
@@ -117,7 +117,7 @@
       "Larry Zeitlin"
     ],
     "doi": "10.3233/HAB-150284",
-    "date": "2015-12-23",
     "item_type": "journalArticle",
     "url": "https://www.medra.org/servlet/aliasResolver?alias=iospress&doi=10.3233/HAB-150284"
   },
@@ -130,7 +130,7 @@
       "Olivier Garraud"
     ],
     "doi": "10.1016/j.transci.2016.12.014",
-    "date": "02/2017",
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S1473050216302002"
   },
@@ -144,7 +144,7 @@
       "K Karunamoorthi"
     ],
     "doi": "",
-    "date": "",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -162,7 +162,7 @@
       "Larry Zeitlin"
     ],
     "doi": "10.3233/HAB-150284",
-    "date": "2015-12-23",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -176,7 +176,7 @@
       "Aaron A. R. Tobian"
     ],
     "doi": "10.1111/trf.12913",
-    "date": "2014-12",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -194,7 +194,7 @@
       "Robert L. Gottlieb"
     ],
     "doi": "10.1038/s41577-021-00542-x",
-    "date": "2021-06",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -210,7 +210,7 @@
       "Marco Tuccori"
     ],
     "doi": "10.1128/CMR.00072-20",
-    "date": "2020-09-16",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -223,7 +223,7 @@
       "Olivier Garraud"
     ],
     "doi": "10.1016/j.transci.2016.12.014",
-    "date": "2017-02",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -237,7 +237,7 @@
       "Luciana Borio"
     ],
     "doi": "10.1128/microbiolspec.EI10-0014-2016",
-    "date": "2016-06",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -257,7 +257,7 @@
       "Xiangguo Qiu"
     ],
     "doi": "10.1016/j.molmed.2017.07.002",
-    "date": "2017-09",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -274,7 +274,7 @@
       "Sina Bavari"
     ],
     "doi": "10.1146/annurev-pharmtox-010716-105055",
-    "date": "2017-01-06",
     "item_type": "journalArticle",
     "url": ""
   }

       "Marco Tuccori"
     ],
     "doi": "",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Sina Bavari"
     ],
     "doi": "10.1146/annurev-pharmtox-010716-105055",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://www.annualreviews.org/doi/10.1146/annurev-pharmtox-010716-105055"
   },
       "Xiangguo Qiu"
     ],
     "doi": "10.1016/j.molmed.2017.07.002",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S1471491417301090"
   },
       "Robert L. Gottlieb"
     ],
     "doi": "10.1038/s41577-021-00542-x",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://www.nature.com/articles/s41577-021-00542-x"
   },
       "M. P. Grobusch"
     ],
     "doi": "10.1080/13543784.2016.1240785",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://www.tandfonline.com/doi/full/10.1080/13543784.2016.1240785"
   },
       "Luciana Borio"
     ],
     "doi": "10.1128/microbiolspec.EI10-0014-2016",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://journals.asm.org/doi/10.1128/microbiolspec.EI10-0014-2016"
   },
       "Larry Zeitlin"
     ],
     "doi": "10.3233/HAB-150284",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://www.medra.org/servlet/aliasResolver?alias=iospress&doi=10.3233/HAB-150284"
   },
       "Olivier Garraud"
     ],
     "doi": "10.1016/j.transci.2016.12.014",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S1473050216302002"
   },
       "K Karunamoorthi"
     ],
     "doi": "",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Larry Zeitlin"
     ],
     "doi": "10.3233/HAB-150284",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Aaron A. R. Tobian"
     ],
     "doi": "10.1111/trf.12913",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Robert L. Gottlieb"
     ],
     "doi": "10.1038/s41577-021-00542-x",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Marco Tuccori"
     ],
     "doi": "10.1128/CMR.00072-20",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Olivier Garraud"
     ],
     "doi": "10.1016/j.transci.2016.12.014",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Luciana Borio"
     ],
     "doi": "10.1128/microbiolspec.EI10-0014-2016",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Xiangguo Qiu"
     ],
     "doi": "10.1016/j.molmed.2017.07.002",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Sina Bavari"
     ],
     "doi": "10.1146/annurev-pharmtox-010716-105055",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   }

data/ebscohost_zotero_items.json DELETED Viewed

The diff for this file is too large to render. See raw diff

data/exportedris-file-1-of-1-1_zotero_items.json DELETED Viewed

@@ -1,813 +0,0 @@
-[
-  {
-    "key": "B4DGMAWK",
-    "title": "Afghanistan Safety Nets Evaluation",
-    "abstract": "The primary objective of this evaluation is to estimate the causal impact of an unconditional cash transfer on the ability of the poorest families in select districts in Afghanistan to smooth consumption during seasonal shocks (e.g., winter-related, agricultural, and water shocks). Secondarily, the study will assess intervention effects on other economic outcomes, ownership and preservation of assets, child wellbeing (including nutrition, education, and refrainment from labor), migration, psychological well-being, and confidence in institutions. The target population consists of the poorest quintile of families with children under the age of five. Unconditional cash transfers will be provided to poor families in three installments: before, at the beginning, and at the end of the lean season. The annual benefit will amount to approximately 8,500 AFN (125 USD) for families with one more child under five; each payment installment is of equal amount.",
-    "full_text": "",
-    "authors": [
-      "Matthew Morton",
-      "Lucian Bucur Pop"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://ridie.3ieimpact.org/index.php?r=search/detailView&id=404"
-  },
-  {
-    "key": "P2VD3QWB",
-    "title": "Financial Education and Financial Access for Transnational Households: Field Experimental Evidence from the Philippines",
-    "abstract": "We implemented a randomized controlled trial among transnational households in the Philippines estimating impacts of a financial education treatment, a financial access treatment, and the combination of the two on financial behaviors. We test whether there are complementarities between both interventions and provide insight into the nature of constraints operating in financial services markets. We find no evidence of complementarities between the financial education and access treatments. In addition, while we find no evidence of constraints in access to formal credit and savings products, our results suggest that access constraints exist in the formal insurance market. Impacts on other financial behaviors are suggestive of the importance of information constraints in financial decision-making. These results provide guidance to designers of financial interventions in similar populations.",
-    "full_text": "",
-    "authors": [
-      "Abarcar P",
-      "Barua R",
-      "Yang D"
-    ],
-    "doi": "10.1086/703045",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "QD6ZPX6I",
-    "title": "Labor Supply Responses to Large Social Transfers: Longitudinal Evidence from South Africa",
-    "abstract": "We quantify the labor supply responses of prime-aged adults to the presence of pensioners in their households, using longitudinal data collected in South Africa. We compare households and individuals before and after pension receipt and pension loss, which allows us to control for a host of unobservable household and individual characteristics that may determine labor market behavior. We,find large cash transfers to the elderly lead to increased employment among prime-aged adults, which occurs primarily through labor migration. The pension's impact is attributable to the increase in household resources it represents, which can be used to stake migrants until they become self-sufficient, and to the presence of pensioners who can care for small children, which allows prime-aged adults to look for work elsewhere. (JEL H23, H55, I38, J22, O15)",
-    "full_text": "",
-    "authors": [
-      "Ardington C",
-      "Case A",
-      "Hosegood V"
-    ],
-    "doi": "10.1257/app.1.1.22",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "VUJDLBR5",
-    "title": "Aid programs' unintended effects: The case of Progresa and migration",
-    "abstract": "This paper analyzes the effect of aid on international and domestic migration and explores the causal effect of income on migration. The theoretical model predicts that the effect of aid \u2026",
-    "full_text": "",
-    "authors": [
-      "Angelucci M"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://papers.ssrn.com/sol3/papers.cfm?abstract_id=868646"
-  },
-  {
-    "key": "29J6T354",
-    "title": "Information, Intermediaries, and International Migration",
-    "abstract": "Job seekers face substantial information frictions, especially in international labor markets where intermediaries match prospective migrants with overseas employers. We conducted a randomized trial in Indonesia to explore how information about intermediary quality shapes migration outcomes. Holding access to information about the return to choosing a high-quality intermediary constant, intermediary-specific quality disclosure reduces the migration rate, cutting use of low-quality providers. Workers who do migrate receive better pre-departure preparation and have improved experiences abroad, despite no change in occupation or destination. These results are not driven by changes in beliefs about average provider quality or the return to migration. Nor does selection explain improved outcomes for those who migrate with quality disclosure. Together, our findings are consistent with an increase in the option value of search: with better ability to differentiate offer quality, workers search longer, select higher-quality intermediaries, and ultimately have better migration experiences.",
-    "full_text": "",
-    "authors": [
-      "Bazzi Samuel",
-      "Cameron Lisa",
-      "Schaner Simone",
-      "Witoelar Firman"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "YIL3BQE5",
-    "title": "An Adaptive Targeted Field Experiment: Job Search Assistance for Refugees in Jordan",
-    "abstract": "We introduce an adaptive targeted treatment assignment methodology for field experiments. Our Tempered Thompson Algorithm balances the goals of maximizing the precision of treatment effect estimates and maximizing the welfare of experimental participants. A hierarchical Bayesian model allows us to adaptively target treatments. We implement our methodology in Jordan, testing policies to help Syrian refugees and local jobseekers to find work. The immediate employment impacts of a small cash grant, information and psychological support are small, but targeting raises employment by 1 percentage-point (20%). After four months, cash has a sizable effect on employment and earnings of Syrians.",
-    "full_text": "",
-    "authors": [
-      "Caria Stefano",
-      "Gordon Grant",
-      "Kasy Maximilian",
-      "Quinn Simon",
-      "Shami Soha",
-      "Teytelboym Alexander"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "JINCDGIG",
-    "title": "Social Protection and Labor Market Outcomes of Youth in South Africa",
-    "abstract": "An Apartheid-driven spatial mismatch between workers and jobs leads to high job search costs for people living in rural areas of South Africa--costs that many young people cannot pay. In this article, the authors examine whether the arrival of a social grant--specifically a generous state-funded old-age pension given to men and women above prime age--enhances the ability of young men in rural areas to seek better work opportunities elsewhere. Based on eight waves of socioeconomic data on household living arrangements and household members' characteristics and employment status, collected between 2001 and 2011 at a demographic surveillance site in KwaZulu-Natal, the authors find that young men are significantly more likely to become labor migrants when someone in their household becomes age-eligible for the old-age pension. But this effect applies only to those who have completed high school (matric), who are on average 8 percentage points more likely to migrate for work when their households become pension eligible, compared with other potential labor migrants. The authors also find that, upon pension loss, it is the youngest migrants who are the most likely to return to their sending households, perhaps because they are the least likely to be self-sufficient at the time the pension is lost. The evidence is consistent with binding credit constraints limiting young men from poorer households from seeking more lucrative work elsewhere.",
-    "full_text": "",
-    "authors": [
-      "Ardington Cally",
-      "Barnighausen Till",
-      "Case Anne",
-      "Menendez Alicia"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "F3ZV6MYR",
-    "title": "Unilateral Facilitation Does Not Raise International Labor Migration From The Philippines",
-    "abstract": "Significant income gains from migrating from poorer to richer countries have motivated unilateral (source-country) policies facilitating labor emigration. However, their effectiveness is unknown. We conducted a large-scale randomized experiment in the Philippines testing the impact of unilaterally facilitating international labor migration. Our most intensive treatment doubled the rate of job offers but had no identifiable effect on international labor migration. Even the highest overseas job-search rate we induced (22%), falls far short of the share initially expressing interest in migrating (34%). We conclude that unilateral migration facilitation will at most induce a trickle, not a flood, of additional emigration.",
-    "full_text": "",
-    "authors": [
-      "Beam Emily A",
-      "Mckenzie David",
-      "Yang Dean"
-    ],
-    "doi": "10.1086/683999",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.journals.uchicago.edu/doi/10.1086/683999"
-  },
-  {
-    "key": "7CUVDKRR",
-    "title": "Long-term impacts of the oportunidades conditional cash transfer program on rural youth in Mexico",
-    "abstract": "This paper studies the long-term effects of partici pation in the Mexican Oportunidades program on a\nvariety of outcomes and behaviors of rural youth in\nMexico. It analyzes data from a social experiment,\nwhich randomly phased-in the program in rural Mex ican villages. In 1997, 320 villages (the treatment\ngroup) were randomly selected for early incorpora tion into the program and 186 villages (the control\ngroup) were designated as a control group to be in corporated eighteen months later. This paper ex amines whether differential exposure to the program\nsignificantly impacted educational attainment, labor\nmarket outcomes, marriage, migration and cognitive\nachievement of youth. The results show positive im pacts of longer exposure on grades of schooling at tained, but no effects on achievement tests. With\nrespect to work, we find an overall reduction in work\nfor male youth.",
-    "full_text": "",
-    "authors": [
-      "Behrman J R",
-      "Parker S W",
-      "Todd P E"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "PKYZCRJU",
-    "title": "Climate and Resilience Impact Evaluation Window: Experimental Evidence from Several Countries",
-    "abstract": "The concept of resilience has gained attention because it recognises the importance of addressing shorter-term humanitarian needs while simultaneously supporting communities to face future crises induced by climate change, conflict, and other factors. Many institutions, including the World Food Programme (WFP), have increasingly used the concept as a basis for their programming. WFP's integrated packages of interventions aim to improve food security and nutrition by smoothing food consumption in the short-term, while supporting livelihoods and addressing barriers to development (e.g., better climate information, access to markets, education, WASH, etc.) in the long-term. While all programme activities are potentially important for building resilience, livelihood activities are clearly connected to both immediate and future wellbeing. These activities include cash or in-kind transfers to the household and support for creating assets that could benefit the household or the community in the future. Therefore, livelihood activities have the potential to support households in improving and maintaining their wellbeing when facing future shocks and stressors. This pre-analysis plan describes policy experiments to estimate the impacts of experimentally varying WFP's activities on resilience as measured by community and household wellbeing. This approach follows others in conceptualizing resilience through changes in wellbeing (Knippenberg et al, 2019, Phadera et al. 2019, Jones and Tanner, 2017; Barrett et al, 2020). We design and run these experiments in the context of livelihoods programs implemented by the World Food Programme (WFP) across 6 countries. Beyond testing the overall impact of livelihood activities on wellbeing, a key ambition of this paper is to investigate whether activities themselves can be timed to accommodate households? 
vulnerability to seasonal fluctuations and shocks that are often connected to weather patterns and agricultural cycle. We identify two such mechanisms: adjusting the timing of cash transfers and labor requirements; and/or allowing for re-targeting participants over time to account for changes in vulnerability status.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.6851-3.1",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/6851"
-  },
-  {
-    "key": "IDE53VC5",
-    "title": "Migration policy: did an emergency provision displace standard rules? Evidence from Italy",
-    "abstract": "In 2011, to manage the exceptional flow of people escaping North Africa, the Italian government released the North Africa Emergency (Emergenza Nord Africa, ENA) provision, temporarily relaxing migration policies for some categories of asylum seekers. Using data from an important charity, we perform baseline difference-in-differences regressions to investigate the impact of this emergency rule on the probability of migrants regularizing their legal status. We exploit the timing of the enactment of the ENA accessibility criteriasuch that potential beneficiaries learned of its existence only after the realization of the state of entitlementto identify the effects of the emergency policy provision on treated and control groups of immigrants. The results show an increased number of successful applications in favor of eligible individuals, although a dramatic boost in the denial rate for other migrants is also observed. This suggests either that some migrants suffered displacement due to the emergency rule, and/or that improper submissions of ENA-oriented applications have occurred. We extend our analysis to the use of multilevel models to shed light on these possible (non-mutually excludable) explanations. Results seem to support the presence of some rule-displacement effects, although the existence of a set of wrongful submissions cannot be excluded. We discuss these possibilities from a policy perspective.",
-    "full_text": "",
-    "authors": [
-      "dalla Pellegrina L",
-      "Saraceno M",
-      "Suardi M"
-    ],
-    "doi": "10.1007/s40888-018-0128-0",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "44ICCPGX",
-    "title": "Does the Role Model Encourage Female Labor Force Participation? Field Experiment in Bangladesh",
-    "abstract": "Enhancing female labor force participation is considered key to economic growth, poverty alleviation, and women?s empowerment. Despite its importance both at the national and household/individual levels, the female labor force participation rate remains low in South Asian countries. It has been a great interest for researchers and policy makers how to enhance female labor force participation in these countries. We investigate whether providing unmarried young women and their parents with information about working conditions through the role model working women encourages unmarried young women?s labor force participation in rural Bangladesh, and if so, how. For this objective, we conduct the randomized controlled trial.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.4940-2.0",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/4940"
-  },
-  {
-    "key": "AEMAYDTW",
-    "title": "Managing the impact of climate on migration: Evidence from Mexico",
-    "abstract": "Although there is a growing literature on the impact of climate and weather-related events on migration, little is known about the mitigating effect of policies directed toward the agricultural sector, or aimed at insuring against environmental disasters. This paper uses state-level data on migration flows between Mexico and the USA from 1999 to 2012 to investigate the mitigating impact of an agricultural cash transfer program (PROCAMPO) and a disaster fund (Fonden) on the migration response to weather shocks. We find that Fonden decreases migration in response to heavy rainfall, hurricanes and droughts. Increases in PROCAMPO amounts paid to small producers play a more ambiguous role in the migration response to shocks. Changes in the distribution of PROCAMPO payments favoring more vulnerable producers in the non-irrigated ejido sector, however, seem to mitigate the impact of droughts on migration.",
-    "full_text": "",
-    "authors": [
-      "Chort I",
-      "Rupelle M de La"
-    ],
-    "doi": "10.1007/s00148-022-00894-1",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://link.springer.com/article/10.1007/s00148-022-00894-1"
-  },
-  {
-    "key": "74WHPTAN",
-    "title": "Impact assessment of the Migrant Resource Centres in the Silk Routes Region",
-    "abstract": "Executive summary Several Migrant Resource Centres (MRCs) have been set up in recent years jointly by national administrations of origin and destination countries and the \u2026",
-    "full_text": "",
-    "authors": [
-      "Dennison J"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.budapestprocess.org/wp-content/uploads/2022/12/ICMPD_MRC_impact_assessment_2022.pdf"
-  },
-  {
-    "key": "EYAF27EQ",
-    "title": "Employment and Irregular Migration: Evidence from Two Randomized Controlled Trials in Egypt",
-    "abstract": "Addressing the root causes of irregular migration has become a key policy priority in Europe. The EU Emergency Trust Fund for Africa (EUTF) was launched in 2015 with a budget of 5 billion euros to support projects aiming at deterring irregular migration flows from 26 origin countries. One of these projects is implemented by the Egyptian Micro, Small and Medium Enterprises Development Agency (MSMEDA) and targets unemployed youth in areas with the highest outflows of irregular migrants. We implement two randomized evaluations to assess whether (i) cash-for-work opportunities, and (ii) training and employment support have the intended effects on the direct beneficiaries and their relatives (household decision-maker, other household members, children, and friends). We assess impacts on people?s preferences and attitudes towards migration, irregular migration, as well as changes in their situation, aspirations, and expectations.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.10604-1.0",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/10604"
-  },
-  {
-    "key": "BBGCWFN6",
-    "title": "Enhancing Female Entrepreneurship through Cash Grants: Experimental Evidence from Rural Tunisia",
-    "abstract": "This research is a product of the World Bank's Middle East and North Africa Gender Innovation Lab (MNAGIL), which conducts rigorous impact evaluations and inferential \u2026",
-    "full_text": "",
-    "authors": [
-      "Zineb SB"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://ericmvukiyehe.com/wp-content/uploads/2021/08/3-Enhancing-Female-Entrepreneurship-through-Cash-Grants-Experimental-Evidence-from-Rural-Tunisia-1.pdf"
-  },
-  {
-    "key": "LU7SCHNY",
-    "title": "Estimating the Impacts of Volunteer vs. Paraprofessional Community Worker Interventions among Conditional Cash Transfer Recipients in the Dominican Republic",
-    "abstract": "This project seeks to estimate the impacts of providing social intermediation services to poor recipients of conditional cash transfers (CCT) in the Dominican Republic (DR). Employing a randomized control trial design, the project will randomly assign either i) referred volunteer, ii) publicly-recruited volunteer, or iii) university-recruited paid paraprofessional \"community workers\" to provide monthly visits to newly enrolled and existing CCT beneficiaries. Households in one arm of the study will only receive cash transfers and will not receive home visits by community workers and an additional arm will include households that are pure controls. Key outcomes of interest include beneficiaries' compliance with program conditionalities, household consumption, primary and secondary school attendance, use of health and other local public services, participation in vocational training, labor market participation, and knowledge of the wellness curriculum administered during the monthly household visits. Data on these key outcomes will be collected both administratively by the DR government and through conducting midline and endline household surveys. In addition to estimating impacts on beneficiary households, the project is designed to estimate the impacts of the community worker employment experience on community worker candidates themselves in terms of their own income, political and community engagement, leadership activities, and subjective wellbeing. Specifically, volunteer and paid employment offers will be randomly offered among those community worker candidates screened into the selection process.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.1778-1.0",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/1778"
-  },
-  {
-    "key": "CDAYBE26",
-    "title": "Evaluation of a Program for the Professionalization of Artisans (ProfArts) in Ghana",
-    "abstract": "Training and professionalization interventions are an important vehicle for economic support within the development assistance landscape. Yet rigorous quantitative impact evaluations of such programs remain scarce, especially in developing countries. In order to help fill this research gap, we will conduct a rigorous impact evaluation of a program for the Professionalization of Artisans (ProfArts) in Ghana. The program will deliver top-up training, licensing, certification, and related benefits to up to 10,000 artisans drawn from the Ghanaian construction sector, with beneficiaries to be randomly selected from up to 20,000 baseline respondents. In a first step, we examine the effects of randomly assigned recruitment content on application rates, the composition of the applicant pool, and downstream program outcomes. In a second step, we use a randomized controlled trial to estimate effects of the program on four groups of outcomes: (i) employment, measured e.g. in terms of job retention, acquisition and lengths of employment spells, (ii) job quality and quality of life, including e.g. earnings and workplace conditions, (iii) mobility, e.g. migration intentions and behaviors, and (iv) firm-level outcomes, e.g. firm performance and employment.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.6842-1.0",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/6842"
-  },
-  {
-    "key": "QMSMF872",
-    "title": "Evaluation of the Network for Enterprise Development Learning through Sewing for Girls (N4G) training program for young women in Ghana",
-    "abstract": "Skills trainings are often a central component of contemporary development assistance strategies, but much of the evidence base for their efficacy comes from high-income countries. RCTs in developing countries are still far less numerous. We contribute to this literature with a rigorous impact evaluation of a program for the empowerment and education of young women in Ghana, called Network for Enterprise Development Learning through Sewing for Girls (N4G). The program will deliver fashion-industry related training and empowerment programs to up to 1,000 underprivileged Ghanaian young women from both urban and rural areas. Beneficiaries are randomly selected from approximately 2,000 baseline respondents. We use a randomized controlled trial to estimate effects of the N4G program on four groups of outcomes: (i) employment, measured for example in terms of employment status, job acquisition, and lengths of employment spells, (ii) job quality, including earnings, having a contract or an oral agreement, job satisfaction, and workplace conditions among others, (iii) quality of life, covering indicators of the current living situation, household assets, and financial dependency, and (iv) mobility, e.g. migration intentions and behaviors.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.7967-1.0",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/7967"
-  },
-  {
-    "key": "2WUKVSZA",
-    "title": "The Impact of Tourist Visas on Intercontinental South-South Migration: Ecuador\u2019s Policy of \u201cOpen Doors\u201d as a Quasi-Experiment",
-    "abstract": "Through the implementation of universal visa freedom from 2008 to 2010, Ecuador became one of the most accessible countries in the world. This article employs mixed methods to study the impact of the de facto opening of Ecuador\u2019s borders on intercontinental south-south migration. First, we use a difference-in-difference design to show that Ecuador\u2019s policy of universal visa freedom led to a significant increase of immigration from previously restricted nationalities in Africa, Asia, and the Caribbean. Complementary descriptive statistics and qualitative findings confirm the decisive impact visa freedom had on intercontinental south-south migration and suggest three main motives: taking advantage of Ecuador\u2019s open doors as an exit option from origin countries, settlement in Ecuador based on relatively improved opportunities, and transmigration to third countries. Our findings imply that travel visa policies of southern countries significantly impact which new south-south flows emerge. \u00a9 The Author(s) 2018.",
-    "full_text": "",
-    "authors": [
-      "Freier L F",
-      "Holloway K"
-    ],
-    "doi": "10.1177/0197918318801068",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.scopus.com/inward/record.uri?eid=2-s2.0-85059900710&doi=10.1177%2f0197918318801068&partnerID=40&md5=60533a0c145229926d2e61b312680c19"
-  },
-  {
-    "key": "YK492G5P",
-    "title": "The REFANI Pakistan study\u2014a cluster randomised controlled trial of the effectiveness and cost-effectiveness of cash-based transfer programmes on child nutrition status: study protocol",
-    "abstract": "Cash-based transfer programmes are an emerging strategy in the prevention of wasting in children, especially targeted at vulnerable households during periods of food insecurity or during emergencies. However, the evidence surrounding the use of either cash or voucher transfer programmes in the humanitarian context and on nutritional outcomes is elusive. More evidence is needed not only to inform the global community of practice on best practices in humanitarian settings, but also to help strengthen national mitigation responses. Methods/Design The Research for Food Assistance on Nutrition Impact Pakistan study (REFANI-P) sets out to evaluate the impact of three cash-based interventions on nutritional outcomes in children aged less than five years from poor and very poor households in Dadu District. This four-arm parallel cluster randomised controlled trial is set among Action Against Hunger (ACF) programme villages in Dadu District, Sindh Province. Mothers are the target recipients of either seasonal unconditional cash transfers or fresh food vouchers. A comparison group receives \u2018standard care\u2019 provided by the ACF programme to which all groups have the same access. The primary outcomes are prevalence of wasting and mean weight-for-height Z-score (WHZ) in children. Impact will be assessed at 6 months and at 1 year from baseline. Using a theory-based approach we will determine \u2018how\u2019 the different interventions work by looking at the processes involved and the impact pathways following the theory of change developed for this context. Quantitative and qualitative data are collected on morbidity, health seeking, hygiene and nutrition behaviours, dietary diversity, haemoglobin concentration, women\u2019s empowerment, household food security and expenditures and social capital. 
The direct and indirect costs of each intervention borne by the implementing organisation and their partners as well as by beneficiaries and their communities are also assessed. Discussion The results of this trial will provide robust evidence to help increase knowledge about the predictability of how different modalities of cash-based transfer work best to reduce the risk of child wasting during a season where food insecurity is at its highest. Evidence on costing and cost-effectiveness will further aid decisions on choice of modality in terms of effectiveness and sustainability.",
-    "full_text": "",
-    "authors": [
-      "Fenn et al"
-    ],
-    "doi": "10.1186/s12889-015-2380-3",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-015-2380-3"
-  },
-  {
-    "key": "4WXF37WF",
-    "title": "How Overseas Opportunities Shape Political Preferences: A Field Experiment on International Migration",
-    "abstract": "This paper demonstrates that access to overseas employment reduces support for taxation and redistribution by bolstering individuals\u2019 economic prospects. We present results from the \ufb01rst randomized controlled trial to result in international migration. Individuals who received the opportunity to migrate from India to the Middle East for work reported signi\ufb01cantly higher wages, greater economic con\ufb01dence, and more \ufb01scally conservative attitudes. Moreover, the program had lasting effects even for those who decided not to migrate, which we link to improved exit options. Our results speak to longstanding debates about the impact of globalization on economic development and welfare state politics.",
-    "full_text": "",
-    "authors": [
-      "Gaikwad N",
-      "Hanson K",
-      "Toth A"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://papers.ssrn.com/sol3/papers.cfm?abstract_id=3816464"
-  },
-  {
-    "key": "68ATB2KG",
-    "title": "How Migrant Resource Centres affect migration decisions: Quasi-experimental evidence from Afghanistan, Bangladesh, Iraq and Pakistan",
-    "abstract": "Several Migrant Resource Centres (MRCs) have been set up in South Asia jointly by national governments of origin and destination countries. Their objectives include encouragement of potential migrants to seek regular rather than irregular routes and to ensure the safety of those migrating, regardless of status. Of theoretical note, their activities utilise innovative, highly personalised counselling. This article provides quasi-experimental evidence of the effect of four activities - telephone and online counselling, and college outreach and pre-departure sessions - on 2215 randomly allocated users of the MRCs' services across six MRCs in four countries: Afghanistan, Bangladesh, Iraq and Pakistan. The effects are a large reduction in self-reported likelihood of migrating irregularly, and a strong increase in awareness of safe options and who to contact for assistance whilst migrating. The effects are consistent across activity type and MRC location, although magnitudes vary. These findings have implications for our understanding of how the decision to migrate is made, what interventions are effective and why.",
-    "full_text": "",
-    "authors": [
-      "Dennison J"
-    ],
-    "doi": "10.1111/imig.13082",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "9YRUKMA5",
-    "title": "The Apprenticeship-to-Work Transition : Experimental Evidence from Ghana",
-    "abstract": "This paper examines the effects of a government-sponsored apprenticeship training program designed to address high levels of youth unemployment in Ghana. The study exploits randomized access to the program to examine the short-run effects of apprenticeship training on labor market outcomes. The results show that apprenticeships shift youth out of wage work and into self-employment. However, the loss of wage income is not offset by increases in self-employment profits in the short run. In addition, the study uses the randomized match between apprentices and training providers to examine the causal effect of characteristics of trainers on outcomes for apprentices. Participants who trained with the most experienced trainers or the most profitable ones had higher earnings. These increases more than offset the program's negative treatment effect on earnings. This suggests that training programs can be made more effective through better recruitment of trainers.",
-    "full_text": "",
-    "authors": [
-      "Hardy Morgan L",
-      "Mbiti Isaac Mulangu",
-      "Mccasland Jamie Lee",
-      "Salcher Isabelle"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.proquest.com/working-papers/apprenticeship-work-transition-experimental/docview/2223061072/se-2 http://UnivofPretoria.on.worldcat.org/atoztitles/link?sid=ProQ:&issn=&volume=&issue=&title=IDEAS+Working+Paper+Series+from+RePEc&spage=&date=2019-01-01&atitle=The+Apprenticeship-to-Work+Transition+%3A+Experimental+Evidence+from+Ghana&au=Hardy%2C+Morgan+L%3BMbiti%2C+Isaac+Mulangu%3BMccasland%2C+Jamie+Lee%3BSalcher%2C+Isabelle&id=doi: https://ideas.repec.org/p/wbk/wbrwps/8851.html"
-  },
-  {
-    "key": "2YVH2MHU",
-    "title": "Get Rich or Die Tryin\u2019: Perceived Earnings, Perceived Mortality Rates, and Migration Decisions of Potential Work Migrants from Nepal",
-    "abstract": "This article reports on a randomized field experiment in which potential work migrants from Nepal to Malaysia and the Persian Gulf countries are provided with information on wages and mortality incidences at their intended destinations. It is found that, particularly for the group of potential migrants without prior foreign migration experience, the information changes their expectations of earnings and mortality risks abroad, which further changes their actual migration decisions. Using the exogenous variation in expectations, it is estimated that the elasticity of migration with respect to mortality rate expectation is 0.8, and the elasticity of migration with respect to earnings expectation is 1.1.",
-    "full_text": "",
-    "authors": [],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "736V6NV8",
-    "title": "Harnessing the Development Benefits of International Migration: A Randomized Evaluation of Enhanced Pre-Departure Orientation Seminars for Migrants from the Philippines",
-    "abstract": "Pre-departure orientation seminars (PDOS) for migrants have the potential to become a key policy tool for increasing the benefits of migration. PDOS build on the fact that many migrants face important knowledge gaps with respect to various aspects of their destination country upon arrival. These knowledge gaps are particularly large for individuals who move from a developing to a developed country and have to navigate a completely different system. Many migrants may hence not be able to make optimal decisions, or only after costly learning. The principal idea of PDOS is to reduce these knowledge gaps early on and provide migrants with the right information to succeed abroad. There is currently no rigorous evidence on the effects of PDOS and on what kind of training modules matter. Using a randomized control trial, this project evaluates the effects of PDOS on migration outcomes of permanent migrants from the Philippines to the US. Together with the Commission on Filipinos Overseas (CFO), the key government agency tasked to manage permanent migration from the Philippines, we have developed new PDOS modules. The new PDOS aims to foster settlement and labor market integration and increase migrants? wellbeing more generally. It also aims to strengthen migrants? engagement in diaspora activities that contribute to development in the Philippines. We identify the effects of the new PDOS by randomly assigning migrants to different types of PDOS and tracking the impact on 1,273 migrants and their family members remaining in the Philippines over a period of two years after departure.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.1389-2.1",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/1389"
-  },
-  {
-    "key": "CNXHNZ6K",
-    "title": "Gender differences in the effects of vocational training: Constraints on women and drop-out behavior",
-    "abstract": "We provide experimental evidence on the effects of vocational and entrepreneurial training for Malawian youth, in an environment where access to schooling and formal sector employment is extremely low. We track a large fraction of program drop-outs \u2013 a common phenomenon in the training evaluation literature \u2013 and this allows us to examine the determinants and consequences of drop-out and how it mediates the effects of such programs. We find that women make decisions in a more constrained environment, and their participation affected by family obligations. Participation is more expensive for them, resulting in worse training experience. The training results in skills development, continued investment in human capital, and improved well-being, with more positive effects for men, but no improvements in labor market outcomes in the short run.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1596/1813-9450-6545",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "P4QQT3NG",
-    "title": "Impacts of Targeted Covid-19 Cash Transfers in Togo",
-    "abstract": "In response to COVID-19, a third of social protection measures have taken the form of cash transfers reaching more than 1.1 billion people --- a 240% increase in coverage from pre-COVID levels. In the aftermath of the COVID-19 pandemic, direct cash transfers are an effective tool to protect vulnerable households. We conduct a randomized controlled trial (RCT) of a targeted cash transfer program implemented in rural Togo between November 2020 and May 2021. In collaboration with GiveDirectly, the government of Togo secured sufficient funding to provide benefits to roughly 57,000 of the approximately 580,000 citizens living in the poorest 100 cantons. Using mobile phone and satellite data, we identified the poorest cantons and poorest people living in them. We randomized the beneficiaries among the poorest phone owners. After registration, every month and for five months, eligible women receive a cash transfer of 8,620 F CFA ($15.5 US) and eligible men, a transfer of 7,450 F CFA ($13.5 US). We conduct a telephone survey at the end of the intervention to measure a wide range of outcomes, including consumption, food security, labor supply, access to health care, education, psychological well-being, financial inclusion and the perception of poverty. We also have access to administrative data of mobile phone companies in Togo, which will allow us to exploit phone usage behaviors and build other types of outcomes, such as adoption and use of the mobile money services, migration or predicted poverty.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.7590-1.1",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/7590"
-  },
-  {
-    "key": "VASWRVLM",
-    "title": "Information campaigns and migration perceptions: Evidence from Senegal",
-    "abstract": "The research studies the effect of information campaigns on irregular immigration on the intentions to migrate irregularly among high school students in Dakar. We analyze which actors and information content are effective the most in shaping students' intention to migrate and migration perceptions.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.8829-1.2",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/8829"
-  },
-  {
-    "key": "M9UMATUQ",
-    "title": "Information and Irregular Migration: Evidence from a Field Experiment in Nigeria",
-    "abstract": "Policy projections and recent research suggest that large numbers of irregular migrants from sub-Saharan Africa will continue to attempt to make their way to Europe over the next few decades. In response, European countries have made and continue to make significant investments in information campaigns designed to discourage irregular African migration. These campaigns are frequently accompanied by evaluations of some sort but, to our knowledge, none have involved a well-powered, randomized controlled trial with a representative sample and actual migration as an outcome. This pre-analysis plan describes the design of field experiment that addresses the following core questions: Are beliefs about migration-related risks, interest in attempting irregular migration, and actual migration decisions responsive to information campaigns highlighting the risks of the migration journey? The project takes place in Edo and Delta states, in the South-South region of Nigeria, a major Sub-Saharan African source of irregular migrants to Europe.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.8718-1.0",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/8718"
-  },
-  {
-    "key": "YFJ6ZQ94",
-    "title": "Informing Risky Migration: Evidence from a field experiment in Guinea",
-    "abstract": "Migrants from Western Africa go through risky migration routes to reach Europe. In addition, African migration to Europe often results in low economic outcomes. Potential migrants might be poorly informed about benefits and costs of migration. We then propose to use a Randomized Control Trial (RCT) to answer the following questions: (i) Are migrants are about their earning opportunities in Europe and risks connected to the journey? (ii) Can an intervention providing information about earnings and risks changes potential migrants? beliefs and so influences their migration choices?",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.4062-1.1",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/4062"
-  },
-  {
-    "key": "ED6H9RXQ",
-    "title": "Micro-credit programs and off-farm migration in China",
-    "abstract": "This paper seeks to evaluate effects of micro-credit projects on the poor. We utilize data that we collected in Sichuan Province in 1999 to investigate whether micro-credit projects have targeted the poor and whether participation in the micro-credit project increases the likelihood of migration and switching to off-farm jobs. We find that, although the micro-credit programs did not help increase assets of the participants, it did help to move one or more of their members into an off-farm job. Our findings indicate that there is a great deal of benefit in supporting microcredit programs. \u00a9 2004 Blackwell Publishing Ltd.",
-    "full_text": "",
-    "authors": [
-      "Li H",
-      "Rozelle S",
-      "Zhang L"
-    ],
-    "doi": "10.1111/j.1468-0106.2004.00245.x",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.scopus.com/inward/record.uri?eid=2-s2.0-9744253083&doi=10.1111%2fj.1468-0106.2004.00245.x&partnerID=40&md5=f2a50ff821db79c4dfabfa1decc3b723"
-  },
-  {
-    "key": "I4MY83RJ",
-    "title": "Experimental long-term effects of early-childhood and school-age exposure to a conditional cash transfer program",
-    "abstract": "Numerous evaluations of conditional cash transfer (CCT) programs show positive short-term impacts, but there is only limited evidence on whether these benefits translate into sustained longer-term gains. This paper uses the municipal-level randomized assignment of a CCT program implemented for five years in Honduras to estimate long-term effects 13 years after the program began. We estimate intent-to-treat effects using individual-level data from the population census, which allows assignment of individuals to their municipality of birth, thereby circumventing migration selection concerns. For the non-indigenous, we find positive and robust impacts on educational outcomes for cohorts of a very wide age range. These include increases of more than 50 percent for secondary school completion rates and the probability of reaching university studies for those exposed at school-going ages. They also include substantive gains for grades attained and current enrollment for others exposed during early childhood, raising the possibility of further gains going forward. Educational gains are, however, more limited for the indigenous. Finally, exposure to the CCT increased the probability of international migration for young men, from 3 to 7 percentage points, also stronger for the non-indigenous. Both early childhood exposure to the nutrition and health components of the CCT as well as exposure during school-going ages to the educational components led to sustained increases in human capital. \u00a9 2019 The Authors",
-    "full_text": "",
-    "authors": [
-      "Molina Mill\u00e1n",
-      "T",
-      "Macours K",
-      "Maluccio J A",
-      "Tejerina L"
-    ],
-    "doi": "10.1016/j.jdeveco.2019.102385",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.scopus.com/inward/record.uri?eid=2-s2.0-85072577537&doi=10.1016%2fj.jdeveco.2019.102385&partnerID=40&md5=cbacf9b13921db5e8346649371e83718"
-  },
-  {
-    "key": "N6R57IVT",
-    "title": "Bilateral labor agreements and the migration of Filipinos: An instrumental variable approach",
-    "abstract": "Bilateral labor agreements (BLAs) are preferred policy models for regulating migration by many governments around the world. The Philippines has been a leader in both agreement conclusion and exporting labor. A recent Congressional evocation is pushing bureaucrats and academics alike to investigate this policy strategy for outcomes and effectiveness. The following analysis answers the question \"Do BLAs affect the migration outflows of Overseas Filipino Workers (OFWs)?\"using a plausibly exogenous variation to isolate a causal effect. I test for effects of BLAs using two instrumental variables (IVs), such as Bilateral Investment Treaties (BITs) and Formal Alliances, and an original dataset of land-based and sea-based Filipino BLAs and migrant stock in 213 unique areas from 1960 to 2018. I do not find any empirical evidence that these treaties drive migration. However, BLAs have statistically significant effects on gross domestic product (GDP) per capita and exports, suggesting other important channels through which these agreements affect economic outcomes. These null results are critically important for policymakers and diplomats because the resources spent on negotiation are wasted if the primary goal is to increase migration. \u00a9 2021 Brianna O'Steen, published by Sciendo.",
-    "full_text": "",
-    "authors": [
-      "O'Steen B"
-    ],
-    "doi": "10.2478/izajodm-2021-0011",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.scopus.com/inward/record.uri?eid=2-s2.0-85117392815&doi=10.2478%2fizajodm-2021-0011&partnerID=40&md5=4d168fa69f58fc0804c9b0a8a8fd3172"
-  },
-  {
-    "key": "64F7ET9X",
-    "title": "Children on the Move : Progressive Redistribution of Humanitarian Cash Transfers among Refugees",
-    "abstract": "This paper evaluates the impact of the Emergency Social Safety Net (ESSN) in Turkey, the largest cash transfer program for international refugees in the world. The paper provides prima facie evidence that the program quickly caused substantial changes in household size and composition, with a net movement of primarily school-age children from larger ineligible households to smaller eligible ones. A sharp decline in inequality is observed in the entire study population: the Gini index declined by four percentage points (or 15 percent) within six months of program rollout, and the poverty headcount at the $3.20/day international poverty line declined by more than 50 percent after one year. ESSN caused a moderate increase in the diversity and frequency of food consumption among eligible households, and although there was no statistically significant effect on overall school enrollment, there were meaningful gains among the most vulnerable beneficiary households. To strike the right balance between transfer size and coverage, key parameters in the design of any cash transfer program, policy makers should consider the possibility that refugee populations may respond to their eligibility status by altering their household structure and living arrangements.",
-    "full_text": "",
-    "authors": [
-      "Ozler Berk",
-      "Celik Cigdem",
-      "Cunningham Scott",
-      "Cuevas Pablo Facundo",
-      "Parisotto Luca"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://search.ebscohost.com/login.aspx?direct=true&db=edsrep&AN=edsrep.p.wbk.wbrwps.9471&site=eds-live"
-  },
-  {
-    "key": "82H99VKZ",
-    "title": "Do higher salaries lower physician migration?",
-    "abstract": "It is believed that low wages are an important reason why doctors and nurses in developing countries migrate, and this has led to a call for higher wages for health professionals in developing countries. In this paper, we provide some of the first estimates of the impact of raising health workers' salaries on migration. Using aggregate panel data on the stock of foreign doctors in 16 Organization for Economic Cooperation and Development countries, we explore the effect of a wage increase programme in Ghana on physician migration. We find evidence that 6 years after the implementation of this programme, the foreign stock of Ghanaian doctors abroad had fallen by approximately 10% relative to the estimated counterfactual. This result should be interpreted with caution, however, given the sensitivity of the results to changes in model specification. \u00a9 2013 The Author.",
-    "full_text": "",
-    "authors": [
-      "Okeke E N"
-    ],
-    "doi": "10.1093/heapol/czt046",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.scopus.com/inward/record.uri?eid=2-s2.0-84906064721&doi=10.1093%2fheapol%2fczt046&partnerID=40&md5=094f43a6ca58fdbf70d99377b4c2379c"
-  },
-  {
-    "key": "924DRNUJ",
-    "title": "Aid and Migration: An Analysis of the Impact of Progresa on the Timing and Size of Labour Migration",
-    "abstract": "This paper models the short and medium-run impact of aid on migration, considering alternatively the effect of nconditional and conditional cash transfers to financially constrained households. Data from the evaluation of a Mexican development program, Progresa, are used to estimate the effect of the potential grant size on migration. The empirical analysis is consistent with model prediction. It shows that the program is associated with an increase in international migration, which is also a positive function of size of potential transfer. The grant may loosen financial constraints. At the same time, fine-tuned conditional grants targeting prospective migrants (in the form of secondary school subsidies) reduce the short-term migration probability. As regards medium-term migration, secondary school beneficiaries are not more likely to migrate than the control group after they complete the subsidised education cycle.",
-    "full_text": "",
-    "authors": [
-      "Manuela Angelucci"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://docs.iza.org/dp1187.pdf"
-  },
-  {
-    "key": "UK8I5GM4",
-    "title": "Medical worker migration and origin-country human capital: Evidence from us visa policy",
-    "abstract": "We exploit changes in U.S. visa policies for nurses to measure the origin-country human capital response to international migration opportunities. Combining data on all migrant departures and postsecondary institutions in the Philippines, we show that nursing enrollment and graduation increased substantially in response to greater U.S. demand for nurses. The supply of nursing programs expanded. Nurse quality, measured by licensure exam pass rates, declined. Despite this, for each nurse migrant, 9 additional nurses were licensed. New nurses switched from other degree types, but graduated at higher rates than they would have otherwise, increasing the human capital stock in the Philippines.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1162/rest_a_01131",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "GIQRAEI7",
-    "title": "Returns to International Migration: Evidence from a Bangladesh-Malaysia Visa Lottery",
-    "abstract": "We follow 3,512 (of 1.4 million) applicants to a government lottery that randomly allocated visas to Bangladeshis for low-skilled, temporary labor contracts in Malaysia. Most lottery winners migrate, and their remittance substantially raises their family's standard of living in Bangladesh. The migrant's absence pauses demographic changes (marriage, childbirth, household formation), and shifts decision-making power towards females. Migration removes enterprising individuals, lowering household entrepreneurship, but does not crowd out other family members' labor supply. One group of applicants were offered deferred migration that never materialized. Improved migration prospects induce pre-migration investments in skills that generate no returns in the domestic market.",
-    "full_text": "",
-    "authors": [
-      "Mobarak Ahmed Mushfiq",
-      "Sharif Iffath",
-      "Shrestha Maheshwor"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "DEFXYBQK",
-    "title": "Role models and migration intentions",
-    "abstract": "Role models\u2014those individuals who resemble us but have achieved more than us\u2014 are thought to impact our aspirations. In this paper, we study the impact of role models on intentions to migrate. Specifically, we implement a randomized controlled trial to show documentaries in rural villages of Mali (Kayes region). These documentaries focus on economic opportunities and show either negative or positive portraits of migrants, or portraits of local people who have successfully set up flourishing businesses without ever considering migration. This paper adds to the larger debate about the efficiency of information provision. We find very few significant impacts, none of which hold when attrition is controlled for using nonparametric Lee bounds. We also implement a treatment heterogeneity analysis using a causal forest algorithm, which aside from confirming our average treatment effects suggests the presence of heterogeneity. It appears that individuals with living conditions that could facilitate migration are less likely to be significantly impacted. The high aspirations to improve living conditions, coupled with a strong feeling of lack of control over the future may help explaining the fact that confrontations with real life experiences do not significantly modify average aspirations to migrate.",
-    "full_text": "",
-    "authors": [
-      "Mespl\u00e9-Somps S",
-      "Nilsson B",
-      "d'Aiglepierre R"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.cairn-int.info/journal-afd-research-papers-2021-200-page-1.htm"
-  },
-  {
-    "key": "RQXKP6NP",
-    "title": "Broken Promises: Evaluating an Incomplete Cash Transfer Program",
-    "abstract": "Interventions in highly insecure and fragile contexts are always confronted with the latent risk of not being able to implement the program as intended. Despite its high policy relevance, little is known about the impacts of program disruption or cancellation on beneficiaries. This study uses the unplanned cancellation of the South Sudan Youth Business Start-Up Grant Program to assess the socioeconomic, behavioral, and psychological consequences of a program that fails to be implemented as intended. Originally planned as a randomized trial, the Youth Startup Business Grant Program consisted of an unconditional cash grant combined with a business and life skills training targeting the youth in South Sudan. Due to the intensification of violence in the country, the disbursement of the grant was terminated in late 2016 before most of the intended beneficiaries had accessed the grant. The study uses survey data from face-to-face interviews and experimental data from lotteries, trust games, and a list experiment to assess the consequences of the cancellation in a comprehensive form. The empirical analysis employs instrumental variable regressions to control for individual characteristics that might have made it more likely to access the grant before disbursement was frozen. The results show that participants who received the originally planned treatment displayed significant improvements in their consumption, savings, and psychological well-being. However, participants who vainly expected to receive the cash grant showed reduced levels of consumption and women among this subgroup also experienced strong reductions in their trust level. In addition, the study finds some evidence that these women were less likely to migrate.",
-    "full_text": "",
-    "authors": [
-      "Muller Angelika",
-      "Pape Utz Johann",
-      "Ralston Laura R"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "G79BE4TK",
-    "title": "The Benefits and Costs of Guest Worker Programs: Experimental Evidence from The India-UAE Migration Corridor",
-    "abstract": "We estimate the returns to temporary migration programs using a randomized control trial with several thousand job seekers in India applying to guest worker jobs in the United Arab \u2026",
-    "full_text": "",
-    "authors": [
-      "Naidu S",
-      "Nyarko Y",
-      "Wang SY"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://econ.cms.arts.ubc.ca/wp-content/uploads/sites/38/2022/09/20221123_Suresh-Naidu.pdf"
-  },
-  {
-    "key": "5J2Z3L7J",
-    "title": "Do social protection programs foster short-term and long-term migration adaptation strategies?",
-    "abstract": "Abstract We examine how migration is influenced by temperature and precipitation variability, and the extent to which the receipt of a cash transfer affects the use of migration as an adaptation strategy. Climate data is merged with georeferenced panel data (2010\u20132014) on individual migration collected from the Zambian Child Grant Program (CGP) sites. We use the person-year dataset to identify the direct and heterogeneous causal effects of the CGP on mobility. Having access to cash transfers doubles the rate of male, short-distance moves during cool periods, irrespective of wealth. Receipt of cash transfers (among wealthier households) during extreme heat causes an additional retention of males. Cash transfers positively spur long-distance migration under normal climate conditions in the long term. They also facilitate short-distance responses to climate, but not long-distance responses that might be demanded by future climate change.",
-    "full_text": "",
-    "authors": [
-      "Mueller Valerie",
-      "Gray Clark",
-      "Handa Sudhanshu",
-      "Seidenfeld David"
-    ],
-    "doi": "10.1017/S1355770X19000214",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.cambridge.org/core/product/identifier/S1355770X19000214/type/journal_article https://www.ncbi.nlm.nih.gov/pmc/articles/PMC7062362/pdf/nihms-1558213.pdf"
-  },
-  {
-    "key": "EX4XE7QK",
-    "title": "Labor Productivity, Remittance Use, and the Impact of the Poverty Alleviation Fund (PAF) Program in Nepal",
-    "abstract": "This dissertation presents three studies related to labor productivity, remittances use, and the effect of an anti-poverty program on migration and remittances. Labor is the biggest endowment available to the poor. Understanding labor issues is important in addressing the problems of poverty, inequality, migration, and economic development. In this dissertation, I estimate the labor productivity of agricultural household because most of the agricultural households in developing countries work in their own farms, it is not possible to observe wages. The first chapter estimates the shadow wage (marginal productivity of labor) of the agricultural household in the context of Nepal. How different is marginal productivity of labor for women compared to men in agricultural households? In developing countries, where most of the families work on their farms, wage or labor-related income cannot be observed directly. This paper contributes to the literature on gender wage difference in labor and development economics by developing a new approach to estimate the shadow wage of agricultural households in Nepal. Using a general functional form, we first derive the shadow wage from a theoretical model. Then, a model with ward-level fixed effects is used to estimate the shadow wage by gender for Nepalese agricultural households. We find that the productivity of women is not that different than that of men. Despite the vast difference in observed market wages for women, the distribution of shadow wages of women is not that different from that of men, calling for policies to increase the market wages for women. The second chapter of this dissertation, attempts to understand the use of remittances among the households of Nepal. Remittances are transfers made by migrant workers to their family and relatives in their country of origin. 
In Nepal, remittances account for 25-30% of the GDP, and the trend of youths seeking work in other countries--mostly in Southeast Asia and the Middle East--has been increasing. Understanding the expenditure pattern of remittances-receiving households compared to non-recipients provides an understanding of the effect of remittances. In this chapter I employ nationally representative data from Nepal to investigate the effect of remittances on household expenditure patterns, and I compare the prevalence of poverty between remittance recipients and non-recipients. The findings that emerge are as follows: households receiving international and both domestic and international remittances have increased expenditure shares on education, suggesting investments in human capital in the household. In contrast I find a decrease in education expenditures for households receiving domestic remittances. Food expenditures share decreases for households receiving all types of remittances. Households receiving remittances increase the expenditure shares on durables and other consumption expenditures. Households receiving remittances have decreased shares in health expenditures. With regards to poverty, the paper shows that receiving remittances reduces the likelihood of being poor. In the third chapter of the dissertation, I evaluate the effects of the Poverty Alleviation Fund program (PAF) on remittances and migration using the data from a quasi-experiment. The PAF is a social fund program that has been providing services to marginalized communities in Nepal through various income-generating activities since 2006. Unlike previous research that has used conditional cash transfer programs (CCTs) to study the role of a development program on migration and remittances, I employ the data from the community-driven anti-poverty program that provides income-generating activities to participants. 
Using a panel dataset collected by Center for Economic Development and Administration (CEDA) of the Tribhuwan University and the PAF, and taking advantage of a quasi-randomized phase-in experimental design, I estimate the causal effects of a development program on remittances, migration, and welfare measures. I show that policy makers should be aware that community-driven development programs have unintended consequences for migration and remittances, which are distinct from the primary goals of the program: alleviating poverty and improving food security. The program results in a decrease of approximately Rs.6000 (approximately six percent of total household consumption) in remittances received, crowding out private transfers in the presence of public transfers. The paper shows an increase in domestic migration, but no change in international migration due to the program.",
-    "full_text": "",
-    "authors": [
-      "Nepal Atul"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "QJH23MCD",
-    "title": "Safe Migration Awareness Campaign In Rural Communities Of Nigeria, The Procedure And Impacts",
-    "abstract": "International migration is undergoing unprecedented changes. The traditional determinants of migration such as poverty, food insecurity and climate change are giving way to new motivations. These new issues, that include but are not limited to ambitions to live a foreign lifestyle, incomplete and asymmetric information are capable of underestimating the risk in irregular migration. As the information about foreign lifestyle flow freely and new opportunities open, it becomes very difficult to manage irregular migration through border control. Within the transitional mode of international migration, the use of awareness campaigns, especially in rural areas of home countries that target the most vulnerable groups, \u2013 school-age youths, could become a veritable means of deterring irregular migration. In 2018, Ricosmigration \u2013 Rural Information Campaign on Safe Migration - received funding from the German Foreign Office to investigate why young people from Nigeria migrate irregularly and implement a safe migration awareness campaign for youth in rural secondary schools. This report is from the result of the project which cut across interviews of Nigerian migrants living in Italy, potential migrants in Nigeria, and the result of the awareness campaigns conducted in 10 secondary schools in Edo, Nigeria. In the report, we explain the profile of a potential migrant from Nigeria. We also explore how reduced capabilities to lead the desired life and how the increasing use of social media internet has greatly raised the likelihood of migration in Nigeria. We equally show in the detail how we implemented a randomized experiment to test the efficiency of the migration awareness campaign. The project provides a new dimension to the discourse of the root cause of migration by introducing the role of limited opportunities and freedom (capabilities), low life satisfaction, and incomplete information through social media. 
Additionally, it shows the power of light interventions such as awareness campaigns in reducing irregular migration. In particular, the result showed that about 77.2 per cent of Nigerian youths that responded to the interview have the intention to migrate abroad, and 37.2 per cent would migrate if they win a cash lottery that is enough to cover the migration cost. Our randomized experiment showed that migration awareness campaign could reduce the risk of being a victim of human trafficking by more than 50 per cent. It could also reduce the desire to engage in irregular migration by more than 30 per cent and increased the decision to take necessary steps to avoid human traffickers and follow proper procedures for safe migration by more than 50 per cent. The awareness campaign had a wide coverage reaching about 7000 students in rural communities in Edo State, Nigeria. The success factors of our awareness campaign include the utilization of appropriate channels, delivery of an accurate message that was tailored to the group we spoke to, and the use of respected external facilitators.",
-    "full_text": "",
-    "authors": [
-      "Obi Chinedu"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://search.ebscohost.com/login.aspx?direct=true&db=edsrep&AN=edsrep.p.osf.socarx.v3kn2&site=eds-live"
-  },
-  {
-    "key": "PM9LIPT3",
-    "title": "Labour migration and households: A reconsideration of the effects of the social pension on labour supply in South Africa",
-    "abstract": "This paper re-examines the effect of the South African social pension on the labour supply of working-age adults using data from 1993. We take account of the fact that households may include non-resident members, and therefore the pension may play a role in facilitating migration to work or look for work. We find that rural African women are significantly more likely to be migrant workers when they are members of a household in receipt of a pension, and that it is female pension income that drives this result. We explore a number of possible reasons why pension income might have this effect.",
-    "full_text": "",
-    "authors": [
-      "Posel D",
-      "Fairburn J A",
-      "Lund F"
-    ],
-    "doi": "10.1016/j.econmod.2005.10.010",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "X835X4JX",
-    "title": "Raising Awareness About the Risk of Irregular Migration: Quasi-Experimental Evidence from Guinea",
-    "abstract": "In response to mounting evidence of harm inflicted on irregular migrants along their journeys from West Africa to Europe, international organizations, civil society organizations, and governments have scaled up campaigns as a tool for raising awareness about the risks of irregular migration. Campaigns aim to counter misinformation by smugglers and facilitate safe migration decisions. Despite the growing number of interventions, there is limited empirical evidence on the impact and effectiveness of such campaigns. Based on a difference-in-difference design, this study investigates the effect of a mobile cinema and community discussion intervention on the perceptions, knowledge, and intentions of potential irregular migrants in Northern Guinea in 2019. The results show that potential migrants who participated in events were significantly more likely to show awareness gains and less likely to report high intentions to migrate irregularly. While the relative importance of risk perceptions and their impact on migration flows remain unclear, the findings provide evidence supporting the assumption that risk awareness can be a relevant factor in the decision-making process of potential irregular migrants. While campaigns may be an effective tool in certain contexts, effect sizes highlight the need for policymakers to keep realistic expectations.",
-    "full_text": "",
-    "authors": [
-      "Tjaden J",
-      "Gninafon H"
-    ],
-    "doi": "10.1111/padr.12468",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "EZTFJFFS",
-    "title": "Household Structure and Short-Run Economic Change in Nicaragua",
-    "abstract": "During the economic crises Nicaragua suffered between 2000 and 2002, a conditional cash transfer program targeting poor households began operating. Using panel data on 1,397 households from the program's experimentally designed evaluation, we examined the impact of the program on household structure. Our findings suggest that the program enabled households to avoid reagglomeration during the economic crises, with households in control communities growing more than treated households. These changes were driven primarily by shifts in residence of relatively young men and women with close kinship ties to the household head. In contrast, households that received transfers continued to send off young adult members, suggesting that the program provided resources to overcome the short-term economic pressures on household structure.",
-    "full_text": "",
-    "authors": [
-      "Winters P",
-      "Stecklov G",
-      "Todd J"
-    ],
-    "doi": "10.1111/j.1741-3737.2009.00628.x",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "G9HHCW5Z",
-    "title": "Empowering Indonesian Migrant Workers to Access Quality Overseas Placement Services",
-    "abstract": "Nearly 700,000 Indonesians migrate abroad for work each year. The vast majority do so through recruiters and placement agencies that facilitate temporary employment in countries across Asia and the Middle East. These agencies support migrants starting with pre-departure paperwork and training through repatriation, and are therefore a crucial determinant of a worker\u2019s migration experience. Potential migrants ostensibly have a great deal of choice between agencies \u2013 there are over 1,000 formally registered firms in Indonesia \u2013 and in theory, competition between these firms should drive out poorly performing agencies. Yet anecdotal evidence suggests that agency quality is highly variable, and that many agencies engage in exploitative practices. This could be due to market power at the local level, or informational failures, both of which would hamper competitive pressures.\nOur findings from preliminary research suggest that despite the fact that nearly three-quarters of female migrants believe that there is no relationship between the quality of the agencies and the experience with the employer; there is indeed a robust correlation between the two variables. However, migrants attribute the employer quality to \"nasib\", or fate.\nIn 2015, we ran information campaigns designed to transmit information on agency quality to potential migrants. Surveys will be conducted to evaluate the impact of the information campaigns on migrants\u2019 outcomes.",
-    "full_text": "",
-    "authors": [
-      "Schaner Simone",
-      "Cameron Lisa",
-      "Bazzi Samuel",
-      "Kartaadipoetra Firman Witoelar"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/630"
-  },
-  {
-    "key": "SNG5JMCQ",
-    "title": "The impact of providing vocational training to young men on labour outcomes and attitudes towards migration in northern Guinea-Bissau",
-    "abstract": "As in most of Sub-Saharan Africa, the lack of quality employment among the rural youth is threatening economic development and inclusive growth, with employment search arguably working as an important driver for both internal and international migration. Active labour market policies, such as vocational trainings, are frequently chosen by governments, international institutions and NGOs as a potential solution to these labour market frictions. Nevertheless, the causal evidence determining the impact of these programs on the youth of rural areas is scarce in the sub-region, and inexistent in Guinea-Bissau. In this project, we run a randomized controlled trial within the GOT project implemented by the NGO ENGIM. This project provides vocational training courses on professional skills thought to be particularly relevant in the local context, and facilitates traineeships in local businesses for young men in two northern regions of the country, aiming to prevent their engagement in irregular migration practices. Assessing the impact of the GOT project on the employment rates, income and attitudes towards migrations of its trainees should contribute to a better understanding of the impact of active labour market policies in rural areas of low income countries, facilitating a better design, implementation and evaluation of such programmes in Guinea-Bissau and similar contexts.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.6890-1.2",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/6890"
-  },
-  {
-    "key": "QYAQM7H9",
-    "title": "Weather Insurance and Investment Choice",
-    "abstract": "Exposure to the risk of extreme weather conditions has been shown to constrain investment\nby subsistence farmers in developing countries and may lead to inefficient production choices.\nThis paper evaluates whether insuring farmers against such risks alters resource allocation decisions. In particular I consider the effects of a Mexican government disaster relief program with\ninsurance-like features. The results, based on a regression discontinuity design, indicate that\ninsurance against losses arising from natural disasters changes how rural households invest in\ntheir farms. Insured farmers utilize more expensive capital inputs and adopt different technologies. Additionally, the insurance changes labor supply patterns. Notably, members of insured\nhouseholds are approximately 10% more likely to migrate internationally. Additional results,\nthat the program matters most when the returns to migration are more unpredictable, are\nconsistent with a model where insurance obviates the need for precautionary savings, allowing\nhouseholds to finance international migration.",
-    "full_text": "",
-    "authors": [
-      "Shapiro J"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "8EFH4AP4",
-    "title": "Can Public Transfers Reduce Mexican Migration? A study based on randomized experimental data",
-    "abstract": "Prior research on Mexican migration has shown that social networks and economic incentives play an important role in determining migration outcomes. This study utilizes experimental data on PROGRESA, Mexico's primary poverty reduction program, to evaluate the effects of public cash transfers on migration. Our study complements a growing body of literature aimed at overcoming longstanding hurdles towards the establishment of causal validity in empirical studies of migration. We find that public cash transfers reduce US migration but have little effect on domestic migration. Furthermore, we find that the provision of cash transfers appears to reduce migration partly by reducing the relative deprivation levels of poor households. Finally, we find that the effect of public cash transfers on US migration depend on the size of existing US migration networks. Surprisingly, we see that transfers have larger (more negative) effects on US migration in communities with large existing networks. The results suggest that public transfers may be helpful in managing rural out-migration, particularly to the US. Interestingly, such programs may be most effective if they are targeted towards communities with strong existing migration patterns.",
-    "full_text": "",
-    "authors": [
-      "Stecklov Guy",
-      "Stampini Marco",
-      "Davis Benjamin"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": ""
-  },
-  {
-    "key": "5M6JE7W5",
-    "title": "Do Conditional Cash Transfers Influence Migration? A Study Using Experimental Data From The Mexican PROGRESA Program",
-    "abstract": "Prior research on Mexican migration has shown that social networks and economic incentives play an important role in determining migration outcomes. We use experimental data from PROGRESA, Mexico's primary poverty-reduction program, to evaluate the effects of conditional cash transfers on migration both domestically and to the United States. Our study complements a growing body of literature aimed at overcoming longstanding hurdles to the establishment of causal validity in empirical studies of migration. Analysis based on the data collected before and after the program's onset shows that conditional transfers reduce U.S. migration but not domestic migration. The data also enable us to explore the role of existing family and community migration networks. The results show that migration networks strongly influence migration, but that the effect of conditional transfers on migration is apparently not mediated by existing migration network structures. Our results suggest that conditional transfers may be helpful in managing rural out-migration, particularly to the United States.",
-    "full_text": "",
-    "authors": [
-      "Stecklov Guy",
-      "Winters Paul",
-      "Stampini Marco",
-      "Davis Benjamin"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.jstor.org/stable/4147339?seq=1#page_scan_tab_contents"
-  },
-  {
-    "key": "DG5T267N",
-    "title": "Cash transfers and migration: theory and evidence from a randomized controlled trial",
-    "abstract": "Will the fast expansion of cash-based programming in developing countries increase international migration? Theoretically, cash transfers may favor international migration by relaxing liquidity, credit, and risk constraints. But transfers, especially those conditional upon staying at home, may also increase the opportunity cost of migrating abroad. This paper evaluates the impact of a cash-for-work program on migration. Randomly selected households in Comoros were offered up to US$320 in cash in exchange for their participation in public works projects. We find that the program increased migration to Mayotte - the neighboring and richer French Island - by 38 percent, from 7.8% to 10.8%. The increase in migration is explained by the alleviation of liquidity and risk constraints, and by the fact that the program did not increase the opportunity cost of migration for likely migrants.",
-    "full_text": "",
-    "authors": [
-      "Sterck O",
-      "Gazeaud J",
-      "Mvukiyehe E"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.csae.ox.ac.uk/materials/papers/csae-wps-2019-16.pdf"
-  },
-  {
-    "key": "CAJ5PJQW",
-    "title": "The impact of Indian SHGs: a long-run field experiment in Jharkhand",
-    "abstract": "This field experiment randomized access to Self-Help Groups in villages spread over the entire state of Jharkhand and surveyed a sample of 1,080 households three times between 2004 and 2009, in order to evaluate the changes in their living standards. We study impacts on children education and labor, household consumption and risk-coping behavior (including migration), and local credit markets.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.5570-1.1",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/5570"
-  },
-  {
-    "key": "MHIY5NJJ",
-    "title": "The value of forecasts: Experimental evidence from developing-country agriculture",
-    "abstract": "Climate risk is a key driver of low agricultural productivity in poor countries. We use a cluster-randomized trial to evaluate a novel risk-mitigation approach: long-range forecasts that provide information about the onset of the Indian summer monsoon well in advance of its arrival. In contrast to traditional approaches that allow farmers to cope with risk ex post, this new ex ante technology provides accurate information at least one month in advance of the monsoon's arrival, enabling farmers to alter cropping choices and other up front input decisions. Moreover, forecasts have the potential to be disseminated cheaply, even at scale. We assign 250 villages to one of three groups: a control group; a group that is given an opportunity to purchase the forecast; and a group that is offered insurance. This design allows us to investigate farmers' willingness-to-pay for forecasts; measure how forecasts affect farmer beliefs, up-front investments, and welfare; and study how these effects compare to the canonical ex post loss mitigation tool: weather-based index insurance.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.8846-1.0",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/8846"
-  },
-  {
-    "key": "YYL2HIQB",
-    "title": "Investments in Human Capital: Long-term Effects of Progresa-Oportunidades on Poverty and Migration in Rural Mexico.",
-    "abstract": "This paper evaluates the effects on poverty reduction and migration of a conditional cash transfer program in Mexico named Oportunidades (previously Progresa). This program, the first in Latin America and the most imitated of its kind, was intended to increase human capital, which would eventually translate into poverty reduction. Linear and non-linear panel models are used to explore whether there are any such effects, and the implications for the effectiveness and evaluation strategies of the program. No significant effects of Progresa-Oportunidades in reducing income poverty or affecting international migration were found at the rural level. However, there is a weak effect in the case of domestic migration. As data continues to become available through Mexico's official Secretariat of Social Development, there will be more opportunities for further exploration of the relationship between this program, poverty alleviation, and migration outcomes. Limitations and further recommendations for this study are also discussed.",
-    "full_text": "",
-    "authors": [
-      "TIRADO J ALEJANDRO"
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://search.ebscohost.com/login.aspx?direct=true&profile=ehost&scope=site&authtype=crawler&jrnl=20672640&AN=113660670&h=tw80U6FJzYcJYu3fTX%2BMPrdXbXrYCOOX2ZDxlHcnJdmg5T13YEukzyFOx75iYT%2F%2BuqTBgG5p2dwmyl3bwBylKg%3D%3D&crl=c"
-  },
-  {
-    "key": "X2YYD8XC",
-    "title": "The effect of peer-to-peer risk information on potential migrants \u2013 Evidence from a randomized controlled trial in Senegal",
-    "abstract": "In response to mounting evidence on the dangers of irregular migration from Africa to Europe, the number of information campaigns which aim to raise awareness about the potential risks has rapidly increased. Governments, international organizations and civil society organizations implement a variety of campaigns to counter the spread of misinformation accelerated by smuggling and trafficking networks. The evidence on the effects of such information interventions on potential migrants remains limited and largely anecdotal. More generally, the role of risk perceptions in the decision-making process of potential irregular migrants is rarely explicitly tested, despite the fact that the concept of risk pervades conventional migration models, particularly in the field of economics. We address this gap by assessing the effects of a peer-to-peer information intervention on the perceptions, knowledge and intentions of potential migrants in Dakar, Senegal, using a randomized controlled trial design. The results show that--three months after the intervention--peer-to-peer information events increase potential migrants' subjective information levels, raise risk awareness, and reduce intentions to migrate irregularly. We find no substantial effects on factual migration knowledge. We discuss how the effects may be driven by the trust and identification-enhancing nature of peer-to-peer communication.",
-    "full_text": "",
-    "authors": [
-      "Tjaden Jasper",
-      "Dunsch Felipe Alexander"
-    ],
-    "doi": "10.1016/j.worlddev.2021.105488",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://linkinghub.elsevier.com/retrieve/pii/S0305750X21001005"
-  },
-  {
-    "key": "FC8EU2Q3",
-    "title": "Universal Basic Income in Kenya",
-    "abstract": "A universal basic income (UBI) is a recurring, unconditional cash transfer sized to meet basic needs and paid to all members of a society. Proponents argue that a UBI has the potential to eliminate extreme poverty and to counteract the harmful effects of rising inequality in wealthier countries. Interest has surged, with UBI actively debated in countries ranging from Switzerland and Finland to Namibia and India. Yet, while cash transfers in general have a strong evidence base, a full basic income has never been implemented or rigorously evaluated. This study proposes to fill these evidence gaps with an ambitious long-term randomized control trial in Kenya. The core objective is to test the hypothesis that a universal basic income is an effective way to eliminate extreme global poverty. This is a central policy question currently being debated in a number of emerging markets, and is also highly relevant for foreign aid policy given that the global poverty gap has fallen to $80B a year as of 2015, less than half of official development assistance flows. Positive results could shift public spending away from in-kind and means-tested programs, while negative ones could have the opposite effect. As a secondary goal, the study also aims to inform debate on the role of UBI in wealthy countries. While the populations are obviously different from those we will work with in East Africa, many of the core questions about human behavior are the same \u2013 does economic security motivate people to work more or less? To socialize more or less? etc. At a minimum, positive results from a low-cost emerging-market evaluation could be a motivator for testing more expensive guarantees in richer countries. Finally, it is worth emphasizing that in the process of producing this evidence the project will also directly benefit some of the poorest people on the planet by delivering cash transfers to them. 
The broader evidence base on cash transfers suggests that these recipients will reap life-changing benefits from participating in the project.",
-    "full_text": "",
-    "authors": [],
-    "doi": "10.1257/rct.1952-2.1",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.socialscienceregistry.org/trials/1952"
-  },
-  {
-    "key": "UX36F5C2",
-    "title": "Liquidity Constraints and Migration: Evidence from Indonesia",
-    "abstract": "Although liquidity constraints have been seen as both a factor limiting individuals from migrating and a motivation for households to send a migrant, the consequences of relaxing liquidity constraints on migration behavior have not been adequately explored due to data limitations. In this study, we take advantage of an unusual policy, Bantuan Langsung Tunai -- a national-level unconditional cash transfer program targeted toward the poorest households in Indonesia -- to empirically assess the impact of increased liquidity on the migration behavior of poor Indonesian households. With a highly mobile population and a long history of circular migration, Indonesia is an ideal space to study migration. Using panel data from the Indonesian Family Life Survey, the results demonstrate that a positive liquidity shock increases the probability of migration among low-asset households, among households with a migration history, and, most significantly, among low-asset households with a migration history. [ABSTRACT FROM AUTHOR] Copyright of International Migration Review is the property of Sage Publications Inc. and its content may not be copied or emailed to multiple sites or posted to a listserv without the copyright holder's express written permission. However, users may print, download, or email articles for individual use. This abstract may be abridged. No warranty is given about the accuracy of the copy. Users should refer to the original published version of the material for the full abstract. (Copyright applies to all Abstracts.)",
-    "full_text": "",
-    "authors": [
-      "Tiwari Smriti",
-      "Winters Paul C"
-    ],
-    "doi": "10.1177/0197918318768555",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "http://journals.sagepub.com/doi/10.1177/0197918318768555"
-  }
-]

data/gene_xpert_zotero_items.json CHANGED Viewed

@@ -13,7 +13,7 @@
       "Hairong Huang"
     ],
     "doi": "10.21037/jtd.2018.02.60",
-    "date": "3/2018",
     "item_type": "journalArticle",
     "url": "http://jtd.amegroups.com/article/view/19447/15515"
   },
@@ -33,7 +33,7 @@
       "David W. Dowdy"
     ],
     "doi": "10.1097/QAI.0000000000000712",
-    "date": "2015-09-1",
     "item_type": "journalArticle",
     "url": "https://journals.lww.com/00126334-201509010-00011"
   },
@@ -52,7 +52,7 @@
       "Sydney Rosen"
     ],
     "doi": "10.1111/j.1365-3156.2012.03028.x",
-    "date": "09/2012",
     "item_type": "journalArticle",
     "url": "https://onlinelibrary.wiley.com/doi/10.1111/j.1365-3156.2012.03028.x"
   },
@@ -75,7 +75,7 @@
       "Keertan Dheda"
     ],
     "doi": "10.1183/09031936.00145511",
-    "date": "07/2012",
     "item_type": "journalArticle",
     "url": "http://erj.ersjournals.com/lookup/doi/10.1183/09031936.00145511"
   },
@@ -94,7 +94,7 @@
       "Achilles Katamba"
     ],
     "doi": "10.1186/s12913-016-1804-9",
-    "date": "12/2016",
     "item_type": "journalArticle",
     "url": "http://bmchealthservres.biomedcentral.com/articles/10.1186/s12913-016-1804-9"
   },
@@ -115,7 +115,7 @@
       "A. H. Van'T Hoog"
     ],
     "doi": "10.5588/ijtld.16.0496",
-    "date": "2017-04-01",
     "item_type": "journalArticle",
     "url": "http://www.ingentaconnect.com/content/10.5588/ijtld.16.0496"
   },
@@ -138,7 +138,7 @@
       "Julio Croda"
     ],
     "doi": "10.1093/cid/ciaa135",
-    "date": "2021-03-01",
     "item_type": "journalArticle",
     "url": "https://academic.oup.com/cid/article/72/5/771/5736588"
   },
@@ -154,7 +154,7 @@
       "Anete Trajman"
     ],
     "doi": "10.1590/s1806-37562015000004524",
-    "date": "12/2015",
     "item_type": "journalArticle",
     "url": "http://www.scielo.br/scielo.php?script=sci_arttext&pid=S1806-37132015000600536&lng=en&tlng=en"
   },
@@ -181,7 +181,7 @@
       "Keertan Dheda"
     ],
     "doi": "10.1016/S2214-109X(19)30164-0",
-    "date": "06/2019",
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S2214109X19301640"
   },
@@ -206,7 +206,7 @@
       "Luis E Cuevas"
     ],
     "doi": "10.1136/bmjgh-2021-007592",
-    "date": "02/2022",
     "item_type": "journalArticle",
     "url": "https://gh.bmj.com/lookup/doi/10.1136/bmjgh-2021-007592"
   },
@@ -222,7 +222,7 @@
       "Elvira Richter"
     ],
     "doi": "10.1183/13993003.01333-2015",
-    "date": "02/2016",
     "item_type": "journalArticle",
     "url": "http://erj.ersjournals.com/lookup/doi/10.1183/13993003.01333-2015"
   },
@@ -244,7 +244,7 @@
       "Susan Cleary"
     ],
     "doi": "10.1371/journal.pone.0251547",
-    "date": "2021-5-14",
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0251547"
   },
@@ -260,7 +260,7 @@
       "M. Shah"
     ],
     "doi": "10.5588/ijtld.13.0095",
-    "date": "2013-10-01",
     "item_type": "journalArticle",
     "url": "http://openurl.ingenta.com/content/xref?genre=article&issn=1027-3719&volume=17&issue=10&spage=1328"
   },
@@ -285,7 +285,7 @@
       "Jacob Creswell"
     ],
     "doi": "10.3201/eid2703.204090",
-    "date": "03/2021",
     "item_type": "journalArticle",
     "url": "https://wwwnc.cdc.gov/eid/article/27/3/20-4090_article.htm"
   },
@@ -300,7 +300,7 @@
       "A. Trajman"
     ],
     "doi": "10.5588/ijtld.13.0637",
-    "date": "2014-05-01",
     "item_type": "journalArticle",
     "url": "http://openurl.ingenta.com/content/xref?genre=article&issn=1027-3719&volume=18&issue=5&spage=547"
   },
@@ -317,7 +317,7 @@
       "Deborah K. Glencross"
     ],
     "doi": "10.4102/ajlm.v10i1.1229",
-    "date": "2021-11-30",
     "item_type": "journalArticle",
     "url": "http://www.ajlmonline.org/index.php/AJLM/article/view/1229"
   },
@@ -337,7 +337,7 @@
       "Maria Claudia Vater"
     ],
     "doi": "10.1590/0037-8682-0082-2018",
-    "date": "10/2018",
     "item_type": "journalArticle",
     "url": "http://www.scielo.br/scielo.php?script=sci_arttext&pid=S0037-86822018000500631&tlng=en"
   },
@@ -361,7 +361,7 @@
       "Luis E. Cuevas"
     ],
     "doi": "10.1128/JCM.00864-15",
-    "date": "08/2015",
     "item_type": "journalArticle",
     "url": "https://journals.asm.org/doi/10.1128/JCM.00864-15"
   },
@@ -386,7 +386,7 @@
       "Corinne S. Merle"
     ],
     "doi": "10.1371/journal.pone.0264206",
-    "date": "2022-2-22",
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0264206"
   },
@@ -406,7 +406,7 @@
       "Prathap Tharyan"
     ],
     "doi": "10.1371/journal.pone.0205233",
-    "date": "2018-10-29",
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0205233"
   },
@@ -423,7 +423,7 @@
       "Susan E Dorman"
     ],
     "doi": "10.1186/1471-2334-13-352",
-    "date": "12/2013",
     "item_type": "journalArticle",
     "url": "https://bmcinfectdis.biomedcentral.com/articles/10.1186/1471-2334-13-352"
   },
@@ -450,7 +450,7 @@
       "Frank Cobelens"
     ],
     "doi": "10.1371/journal.pmed.1001120",
-    "date": "2011-11-8",
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pmed.1001120"
   },
@@ -468,7 +468,7 @@
       "Achilles Katamba"
     ],
     "doi": "10.1371/journal.pone.0122574",
-    "date": "2015-4-1",
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0122574"
   },
@@ -486,7 +486,7 @@
       "Brittany Moore"
     ],
     "doi": "10.1007/s40258-018-0397-3",
-    "date": "8/2018",
     "item_type": "journalArticle",
     "url": "http://link.springer.com/10.1007/s40258-018-0397-3"
   },
@@ -502,7 +502,7 @@
       "Charoen Chuchottaworn"
     ],
     "doi": "10.1016/j.vhri.2019.09.010",
-    "date": "05/2020",
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S221210992030008X"
   },
@@ -519,7 +519,7 @@
       "Kevin Schwartzman"
     ],
     "doi": "10.1371/journal.pone.0150119",
-    "date": "2016-3-18",
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0150119"
   },
@@ -533,7 +533,7 @@
       "Alemayehu Hailu"
     ],
     "doi": "10.1371/journal.pone.0259056",
-    "date": "2021-10-25",
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0259056"
   },
@@ -555,7 +555,7 @@
       "Esther Turunga"
     ],
     "doi": "10.1097/QAI.0000000000002371",
-    "date": "2020-07-1",
     "item_type": "journalArticle",
     "url": "https://journals.lww.com/10.1097/QAI.0000000000002371"
   },
@@ -575,7 +575,7 @@
       "Jos\u00e9 Mar\u00eda Ten\u00edas-Burillo"
     ],
     "doi": "10.1016/j.eimc.2016.06.009",
-    "date": "08/2017",
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S0213005X16301550"
   },
@@ -595,7 +595,7 @@
       "Jos\u00e9 Mar\u00eda Ten\u00edas-Burillo"
     ],
     "doi": "10.1016/j.eimc.2016.06.009",
-    "date": "08/2017",
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S0213005X16301550"
   },
@@ -611,7 +611,7 @@
       "Nelson L.S. Lee"
     ],
     "doi": "10.1016/j.jinf.2014.12.015",
-    "date": "04/2015",
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S016344531500002X"
   }

       "Hairong Huang"
     ],
     "doi": "10.21037/jtd.2018.02.60",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://jtd.amegroups.com/article/view/19447/15515"
   },
       "David W. Dowdy"
     ],
     "doi": "10.1097/QAI.0000000000000712",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://journals.lww.com/00126334-201509010-00011"
   },
       "Sydney Rosen"
     ],
     "doi": "10.1111/j.1365-3156.2012.03028.x",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://onlinelibrary.wiley.com/doi/10.1111/j.1365-3156.2012.03028.x"
   },
       "Keertan Dheda"
     ],
     "doi": "10.1183/09031936.00145511",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://erj.ersjournals.com/lookup/doi/10.1183/09031936.00145511"
   },
       "Achilles Katamba"
     ],
     "doi": "10.1186/s12913-016-1804-9",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://bmchealthservres.biomedcentral.com/articles/10.1186/s12913-016-1804-9"
   },
       "A. H. Van'T Hoog"
     ],
     "doi": "10.5588/ijtld.16.0496",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://www.ingentaconnect.com/content/10.5588/ijtld.16.0496"
   },
       "Julio Croda"
     ],
     "doi": "10.1093/cid/ciaa135",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://academic.oup.com/cid/article/72/5/771/5736588"
   },
       "Anete Trajman"
     ],
     "doi": "10.1590/s1806-37562015000004524",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://www.scielo.br/scielo.php?script=sci_arttext&pid=S1806-37132015000600536&lng=en&tlng=en"
   },
       "Keertan Dheda"
     ],
     "doi": "10.1016/S2214-109X(19)30164-0",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S2214109X19301640"
   },
       "Luis E Cuevas"
     ],
     "doi": "10.1136/bmjgh-2021-007592",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://gh.bmj.com/lookup/doi/10.1136/bmjgh-2021-007592"
   },
       "Elvira Richter"
     ],
     "doi": "10.1183/13993003.01333-2015",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://erj.ersjournals.com/lookup/doi/10.1183/13993003.01333-2015"
   },
       "Susan Cleary"
     ],
     "doi": "10.1371/journal.pone.0251547",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0251547"
   },
       "M. Shah"
     ],
     "doi": "10.5588/ijtld.13.0095",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://openurl.ingenta.com/content/xref?genre=article&issn=1027-3719&volume=17&issue=10&spage=1328"
   },
       "Jacob Creswell"
     ],
     "doi": "10.3201/eid2703.204090",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://wwwnc.cdc.gov/eid/article/27/3/20-4090_article.htm"
   },
       "A. Trajman"
     ],
     "doi": "10.5588/ijtld.13.0637",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://openurl.ingenta.com/content/xref?genre=article&issn=1027-3719&volume=18&issue=5&spage=547"
   },
       "Deborah K. Glencross"
     ],
     "doi": "10.4102/ajlm.v10i1.1229",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://www.ajlmonline.org/index.php/AJLM/article/view/1229"
   },
       "Maria Claudia Vater"
     ],
     "doi": "10.1590/0037-8682-0082-2018",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://www.scielo.br/scielo.php?script=sci_arttext&pid=S0037-86822018000500631&tlng=en"
   },
       "Luis E. Cuevas"
     ],
     "doi": "10.1128/JCM.00864-15",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://journals.asm.org/doi/10.1128/JCM.00864-15"
   },
       "Corinne S. Merle"
     ],
     "doi": "10.1371/journal.pone.0264206",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0264206"
   },
       "Prathap Tharyan"
     ],
     "doi": "10.1371/journal.pone.0205233",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0205233"
   },
       "Susan E Dorman"
     ],
     "doi": "10.1186/1471-2334-13-352",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://bmcinfectdis.biomedcentral.com/articles/10.1186/1471-2334-13-352"
   },
       "Frank Cobelens"
     ],
     "doi": "10.1371/journal.pmed.1001120",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pmed.1001120"
   },
       "Achilles Katamba"
     ],
     "doi": "10.1371/journal.pone.0122574",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0122574"
   },
       "Brittany Moore"
     ],
     "doi": "10.1007/s40258-018-0397-3",
+    "year": null,
     "item_type": "journalArticle",
     "url": "http://link.springer.com/10.1007/s40258-018-0397-3"
   },
       "Charoen Chuchottaworn"
     ],
     "doi": "10.1016/j.vhri.2019.09.010",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S221210992030008X"
   },
       "Kevin Schwartzman"
     ],
     "doi": "10.1371/journal.pone.0150119",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0150119"
   },
       "Alemayehu Hailu"
     ],
     "doi": "10.1371/journal.pone.0259056",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://dx.plos.org/10.1371/journal.pone.0259056"
   },
       "Esther Turunga"
     ],
     "doi": "10.1097/QAI.0000000000002371",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://journals.lww.com/10.1097/QAI.0000000000002371"
   },
       "Jos\u00e9 Mar\u00eda Ten\u00edas-Burillo"
     ],
     "doi": "10.1016/j.eimc.2016.06.009",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S0213005X16301550"
   },
       "Jos\u00e9 Mar\u00eda Ten\u00edas-Burillo"
     ],
     "doi": "10.1016/j.eimc.2016.06.009",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S0213005X16301550"
   },
       "Nelson L.S. Lee"
     ],
     "doi": "10.1016/j.jinf.2014.12.015",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://linkinghub.elsevier.com/retrieve/pii/S016344531500002X"
   }

data/kayongo-papers_zotero_items.json DELETED Viewed

@@ -1,222 +0,0 @@
-[
-  {
-    "key": "UNWR6MI4",
-    "title": "Le\u00e7ons du Rapid Response Service en Ouganda",
-    "abstract": "R\u00e9sum\u00e9 Le Service de r\u00e9ponse rapide (RRS)\u2013en anglais Rapid Reponse Service\u2013est un service d'application de connaissances. Il r\u00e9pond au besoin de donn\u00e9es des d\u00e9cideurs en \u2026",
-    "full_text": "",
-    "authors": [
-      "I Kawooya",
-      "I Ddumba",
-      "E Kayongo",
-      "..."
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.cres-sn.org/wp-content/uploads/2022/03/Ebook-Donnees-probantes.pdf#page=241"
-  },
-  {
-    "key": "QEZLUVIL",
-    "title": "Brain Magnetic Resonance Imaging and Angiography Findings in Ugandan Children with Sickle Cell Anemia; A Cross Sectional Study",
-    "abstract": "Abstract Sickle Cell Anemia (SCA) is a leading cause of childhood stroke in sub-Saharan Africa and sickle cell brain vasculopathy manifests either as overt stroke or clinically\" silent \u2026",
-    "full_text": "",
-    "authors": [
-      "R Idro",
-      "NS Green",
-      "D Munube",
-      "LR Buluma",
-      "B Kebirungi",
-      "..."
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://ashpublications.org/blood/article/132/Supplement%201/2376/264336"
-  },
-  {
-    "key": "BN43BLJ5",
-    "title": "Accuracy of the chest x-ray in screening for tuberculosis in Uganda: A cross-sectional study.",
-    "abstract": "Abstract ABSTRACT BACKGROUND: The WHO END TB strategy requires\u2265 90% case detection to combat tuberculosis (TB). Increased TB case detection requires a more \u2026",
-    "full_text": "",
-    "authors": [
-      "J Nalunjogi",
-      "F Mugabe",
-      "I Najjingo",
-      "P Lusiba",
-      "F Olweny",
-      "..."
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.researchsquare.com/article/rs-37900/latest.pdf"
-  },
-  {
-    "key": "PF63FYYY",
-    "title": "Rapidly responding to policy queries with evidence: Learning from rapid response services in Uganda",
-    "abstract": "Summary The Rapid Response Service (RRS) is a knowledge translation service in Uganda that responds to a decision maker's needs for evidence with synthesised relevant evidence \u2026",
-    "full_text": "",
-    "authors": [
-      "I Kawooya",
-      "I Ddumba",
-      "E Kayongo",
-      "..."
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://library.oapen.org/bitstream/handle/20.500.12657/39511/9780367440121_text.pdf?sequence=1#page=159"
-  },
-  {
-    "key": "VXFKNQIN",
-    "title": "Pre-diagnostic drop out of presumptive TB patients and its associated factors at Bugembe Health Centre IV in Jinja, Uganda",
-    "abstract": "Background: Drop out of presumptive TB individuals before making a final diagnosis poses a danger to the individual and their community. We aimed to determine the proportion of \u2026",
-    "full_text": "",
-    "authors": [
-      "G Ekuka",
-      "I Kawooya",
-      "E Kayongo",
-      "R Ssenyonga",
-      "..."
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.ajol.info/index.php/ahs/article/view/197831"
-  },
-  {
-    "key": "KQWSK82P",
-    "title": "Point\u2010of\u2010care diagnostic tests for sickle cell disease",
-    "abstract": "Objectives This is a protocol for a Cochrane Review (diagnostic). The objectives are as follows: To determine the accuracy of point\u2010of\u2010care tests (POCT) to screen sickle cell \u2026",
-    "full_text": "",
-    "authors": [
-      "I Kawooya",
-      "E Kayongo",
-      "D Munube",
-      "..."
-    ],
-    "doi": "10.1002/14651858.CD014584",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.cochranelibrary.com/cdsr/doi/10.1002/14651858.CD014584/abstract"
-  },
-  {
-    "key": "8PMU8JR9",
-    "title": "of nodding syndrome",
-    "abstract": "Aims. Nodding syndrome is a poorly understood acquired disorder affecting children in sub-Saharan Africa. The aetiology and pathogenesis are unknown, and no specific treatment is \u2026",
-    "full_text": "",
-    "authors": [
-      "E Kayongo",
-      "N Gumisiriza",
-      "A Lanyero",
-      "..."
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://pdfs.semanticscholar.org/a0a3/7f6c382fe555492d8640855e31bf233881c0.pdf"
-  },
-  {
-    "key": "AN26LWTD",
-    "title": "Accuracy and incremental yield of the chest X-ray in screening for tuberculosis in Uganda: a cross-sectional study",
-    "abstract": "The WHO END TB strategy requires\u2265 90% case detection to combat tuberculosis (TB). Increased TB case detection requires a more sensitive and specific screening tool \u2026",
-    "full_text": "",
-    "authors": [
-      "J Nalunjogi",
-      "F Mugabe",
-      "I Najjingo",
-      "P Lusiba",
-      "..."
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.hindawi.com/journals/trt/2021/6622809/"
-  },
-  {
-    "key": "MAYC8H5C",
-    "title": "Vulnerability of Populations to Malaria after Indoor Residual Spraying is Withdrawn from Areas where its Use has Previously Been Sustained. Protocol for a Systematic \u2026",
-    "abstract": "Background: With its proven effectiveness, indoor residual spraying (IRS) as a malaria vector control strategy forms one of the reliable vector control strategies, especially when at \u2026",
-    "full_text": "",
-    "authors": [
-      "P Orishaba",
-      "E Kayongo",
-      "P Lusiba",
-      "C Nakalema",
-      "..."
-    ],
-    "doi": "10.1101/2022.05.24.22275507.abstract",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.medrxiv.org/content/10.1101/2022.05.24.22275507.abstract"
-  },
-  {
-    "key": "S2FGVY8R",
-    "title": "Asymptomatic malaria parasitaemia and seizure control in children with nodding syndrome; a cross-sectional study",
-    "abstract": "Objective Plasmodium falciparum is epileptogenic and in malaria endemic areas, is a leading cause of acute seizures. In these areas, asymptomatic infections are common but \u2026",
-    "full_text": "",
-    "authors": [
-      "R Ogwang",
-      "R Anguzu",
-      "P Akun",
-      "A Ningwa",
-      "E Kayongo",
-      "..."
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://bmjopen.bmj.com/content/8/10/e023624.abstract"
-  },
-  {
-    "key": "6KALDEWN",
-    "title": "Adherence to the MDR-TB intensive phase treatment protocol amongst individuals followed up at central and peripheral health care facilities in Uganda-a descriptive \u2026",
-    "abstract": "Background: Following initiation of MDR-TB treatment, patients have a choice to receive follow up DOT supervision at either the central initiating facility or at a peripheral facility \u2026",
-    "full_text": "",
-    "authors": [
-      "J Mukasa",
-      "E Kayongo",
-      "I Kawooya",
-      "D Lukoye",
-      "..."
-    ],
-    "doi": "",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://www.ajol.info/index.php/ahs/article/view/197828"
-  },
-  {
-    "key": "76FY87Z6",
-    "title": "The natural history of nodding syndrome",
-    "abstract": "Aims. Nodding syndrome is a poorly understood acquired disorder affecting children in sub\u2010Saharan Africa. The aetiology and pathogenesis are unknown, and no specific treatment is \u2026",
-    "full_text": "",
-    "authors": [
-      "R Idro",
-      "R Ogwang",
-      "E Kayongo",
-      "N Gumisiriza",
-      "..."
-    ],
-    "doi": "10.1684/epd.2018.1012",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://onlinelibrary.wiley.com/doi/abs/10.1684/epd.2018.1012"
-  },
-  {
-    "key": "TQQ2BYRK",
-    "title": "Paper 1: Demand-driven rapid reviews for health policy and systems decision-making: lessons from Lebanon, Ethiopia, and South Africa on researchers and \u2026",
-    "abstract": "Rapid reviews have emerged as an approach to provide contextualized evidence in a timely and efficient manner. Three rapid review centers were established in Ethiopia, Lebanon \u2026",
-    "full_text": "",
-    "authors": [
-      "RM Mijumbi-Deve",
-      "I Kawooya",
-      "E Kayongo",
-      "R Izizinga",
-      "..."
-    ],
-    "doi": "10.1186/s13643-022-02021-3",
-    "year": null,
-    "item_type": "journalArticle",
-    "url": "https://link.springer.com/article/10.1186/s13643-022-02021-3"
-  }
-]

data/vaccine_coverage_zotero_items.json CHANGED Viewed

@@ -17,7 +17,7 @@
       "Rania A Tohme"
     ],
     "doi": "10.15585/mmwr.mm7229a2",
-    "date": "2023",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -31,7 +31,7 @@
       "Edgar Mugema Mulogo"
     ],
     "doi": "10.21522/TIJPH.2013.09.03.Art019",
-    "date": "2021",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -45,7 +45,7 @@
       "Edgar Mugema Mulogo"
     ],
     "doi": "10.21522/TIJPH.2013.09.04.Art008",
-    "date": "2021",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -89,7 +89,7 @@
       "G. Shapira"
     ],
     "doi": "10.1371/journal.pmed.1004070",
-    "date": "2022",
     "item_type": "journalArticle",
     "url": "https://www.scopus.com/inward/record.uri?eid=2-s2.0-85137126764&doi=10.1371%2fjournal.pmed.1004070&partnerID=40&md5=32f1cd887f5eb46121eb1e48abfcdaaf"
   },
@@ -111,7 +111,7 @@
       "Yahaya Gavamukulya"
     ],
     "doi": "10.1016/j.dib.2019.104269",
-    "date": "2019",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -137,7 +137,7 @@
       "Kirsty Le Doare"
     ],
     "doi": "10.1136/bmjgh-2021-006102",
-    "date": "2021",
     "item_type": "journalArticle",
     "url": "https://search.ebscohost.com/login.aspx?direct=true&db=cmedm&AN=34452941&site=ehost-live&scope=site"
   },
@@ -152,7 +152,7 @@
       "Tsai-Ching Hsu"
     ],
     "doi": "",
-    "date": "2020",
     "item_type": "journalArticle",
     "url": "https://search.ebscohost.com/login.aspx?direct=true&db=a9h&AN=148721705&site=ehost-live&scope=site"
   },
@@ -176,7 +176,7 @@
       "E. M. Mulogo"
     ],
     "doi": "10.1186/s12879-022-07579-w",
-    "date": "2022",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -192,7 +192,7 @@
       "D. Kajungu"
     ],
     "doi": "10.1186/s12913-023-09875-w",
-    "date": "2023",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -210,7 +210,7 @@
       "C. Banura"
     ],
     "doi": "10.1186/s12889-022-13113-z",
-    "date": "2022",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -242,7 +242,7 @@
       "N. Fadl"
     ],
     "doi": "10.1007/s10900-023-01261-1",
-    "date": "2024",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -264,7 +264,7 @@
       "Y. Gavamukulya"
     ],
     "doi": "10.1016/j.dib.2019.104269",
-    "date": "2019",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -286,7 +286,7 @@
       "Y. Gavamukulya"
     ],
     "doi": "10.9734/ijtdh/2019/v39i330209",
-    "date": "2019",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -303,7 +303,7 @@
       "H. W. Reynolds"
     ],
     "doi": "10.3390/vaccines11030647",
-    "date": "2023",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -320,7 +320,7 @@
       "E. Sacks"
     ],
     "doi": "10.1093/heapol/czaa099",
-    "date": "2020",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -341,7 +341,7 @@
       "L. Berman"
     ],
     "doi": "10.3390/vaccines11020375",
-    "date": "2023",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -359,7 +359,7 @@
       "P. Waiswa"
     ],
     "doi": "10.1186/s12913-021-06554-6",
-    "date": "2021",
     "item_type": "journalArticle",
     "url": ""
   },
@@ -378,7 +378,7 @@
       "F. Guillen-Grima"
     ],
     "doi": "10.3390/vaccines11061103",
-    "date": "2023",
     "item_type": "journalArticle",
     "url": ""
   }

       "Rania A Tohme"
     ],
     "doi": "10.15585/mmwr.mm7229a2",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Edgar Mugema Mulogo"
     ],
     "doi": "10.21522/TIJPH.2013.09.03.Art019",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Edgar Mugema Mulogo"
     ],
     "doi": "10.21522/TIJPH.2013.09.04.Art008",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "G. Shapira"
     ],
     "doi": "10.1371/journal.pmed.1004070",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://www.scopus.com/inward/record.uri?eid=2-s2.0-85137126764&doi=10.1371%2fjournal.pmed.1004070&partnerID=40&md5=32f1cd887f5eb46121eb1e48abfcdaaf"
   },
       "Yahaya Gavamukulya"
     ],
     "doi": "10.1016/j.dib.2019.104269",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Kirsty Le Doare"
     ],
     "doi": "10.1136/bmjgh-2021-006102",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://search.ebscohost.com/login.aspx?direct=true&db=cmedm&AN=34452941&site=ehost-live&scope=site"
   },
       "Tsai-Ching Hsu"
     ],
     "doi": "",
+    "year": null,
     "item_type": "journalArticle",
     "url": "https://search.ebscohost.com/login.aspx?direct=true&db=a9h&AN=148721705&site=ehost-live&scope=site"
   },
       "E. M. Mulogo"
     ],
     "doi": "10.1186/s12879-022-07579-w",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "D. Kajungu"
     ],
     "doi": "10.1186/s12913-023-09875-w",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "C. Banura"
     ],
     "doi": "10.1186/s12889-022-13113-z",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "N. Fadl"
     ],
     "doi": "10.1007/s10900-023-01261-1",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Y. Gavamukulya"
     ],
     "doi": "10.1016/j.dib.2019.104269",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "Y. Gavamukulya"
     ],
     "doi": "10.9734/ijtdh/2019/v39i330209",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "H. W. Reynolds"
     ],
     "doi": "10.3390/vaccines11030647",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "E. Sacks"
     ],
     "doi": "10.1093/heapol/czaa099",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "L. Berman"
     ],
     "doi": "10.3390/vaccines11020375",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "P. Waiswa"
     ],
     "doi": "10.1186/s12913-021-06554-6",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   },
       "F. Guillen-Grima"
     ],
     "doi": "10.3390/vaccines11061103",
+    "year": null,
     "item_type": "journalArticle",
     "url": ""
   }

data/zotero-collection-pastan_zotero_items.json DELETED Viewed

The diff for this file is too large to render. See raw diff

docs.py DELETED Viewed

@@ -1,13 +0,0 @@
-description = """
-Welcome to the Acres AI RAG API documentation.
-### RAG Tasks
-- Use the `/process_zotero_library_items`: Process zotero library items with your zotero credentials.
-- Use the `/get_study_info`: Get number of documents in a zotero study.
-- Use the `/study_variables`: Get research summary from the study provided the study variables.
-- Use the `/download_csv`: Export the markdown text to a csv file.
-"""
-tags_metadata = [
-    {"name": "ACRES RAG", "description": "AI RAG Application"},
-]

infra/ecs_config.template DELETED Viewed

@@ -1,7 +0,0 @@
-[deploy]
-bucket = 'dev-acres-gradio-bucket'
-region = 'us-east-1'
-stack_name = 'AcresRag'
-[parameters]
-ContainerImageGradio = '224427659xxxx.dkr.ecr.us-east-1.amazonaws.com/gradio-app-prod:latest'

infra/ecs_fargate.yml DELETED Viewed

@@ -1,581 +0,0 @@
-AWSTemplateFormatVersion: '2010-09-09'
-Description: Deploy Gradio and FastAPI services on AWS ECS Fargate
-Parameters:
-  Environment:
-    Type: String
-    Default: dev
-    AllowedValues: [dev, prod]
-  # VPC Configuration
-  VpcCIDR:
-    Type: String
-    Default: 10.0.0.0/16
-  PublicSubnet1CIDR:
-    Type: String
-    Default: 10.0.1.0/24
-  PublicSubnet2CIDR:
-    Type: String
-    Default: 10.0.2.0/24
-  # ECS Configuration
-  ECSClusterName:
-    Type: String
-    Default: rag-ecs-cluster
-  GradioTaskDefinitionCPU:
-    Type: Number
-    Default: 512
-  GradioTaskDefinitionMemory:
-    Type: Number
-    Default: 1024
-  FastAPITaskDefinitionCPU:
-    Type: Number
-    Default: 256
-  FastAPITaskDefinitionMemory:
-    Type: Number
-    Default: 512
-  # Container Images
-  ContainerImageGradio:
-    Type: String
-    Description: URI of the Gradio container image in ECR
-  ContainerImageFastAPI:
-    Type: String
-    Description: URI of the FastAPI container image in ECR
-  # CertificateArn:
-  #   Type: String
-Resources:
-  # VPC and Networking
-  VPC:
-    Type: AWS::EC2::VPC
-    Properties:
-      CidrBlock: !Ref VpcCIDR
-      EnableDnsHostnames: true
-      EnableDnsSupport: true
-      Tags:
-        - Key: Name
-          Value: !Sub ${Environment}-acres-vpc
-  InternetGateway:
-    Type: AWS::EC2::InternetGateway
-    Properties:
-      Tags:
-        - Key: Name
-          Value: !Sub ${Environment}-acres-igw
-  AttachGateway:
-    Type: AWS::EC2::VPCGatewayAttachment
-    Properties:
-      VpcId: !Ref VPC
-      InternetGatewayId: !Ref InternetGateway
-  PublicSubnet1:
-    Type: AWS::EC2::Subnet
-    Properties:
-      VpcId: !Ref VPC
-      AvailabilityZone: !Select [0, !GetAZs '']
-      CidrBlock: !Ref PublicSubnet1CIDR
-      MapPublicIpOnLaunch: true
-      Tags:
-        - Key: Name
-          Value: !Sub ${Environment}-acres-public-subnet-1
-  PublicSubnet2:
-    Type: AWS::EC2::Subnet
-    Properties:
-      VpcId: !Ref VPC
-      AvailabilityZone: !Select [1, !GetAZs '']
-      CidrBlock: !Ref PublicSubnet2CIDR
-      MapPublicIpOnLaunch: true
-      Tags:
-        - Key: Name
-          Value: !Sub ${Environment}-acres-public-subnet-2
-  PublicRouteTable:
-    Type: AWS::EC2::RouteTable
-    Properties:
-      VpcId: !Ref VPC
-      Tags:
-        - Key: Name
-          Value: !Sub ${Environment}-acres-public-rt
-  PublicRoute:
-    Type: AWS::EC2::Route
-    DependsOn: AttachGateway
-    Properties:
-      RouteTableId: !Ref PublicRouteTable
-      DestinationCidrBlock: 0.0.0.0/0
-      GatewayId: !Ref InternetGateway
-  PublicSubnet1RouteTableAssociation:
-    Type: AWS::EC2::SubnetRouteTableAssociation
-    Properties:
-      SubnetId: !Ref PublicSubnet1
-      RouteTableId: !Ref PublicRouteTable
-  PublicSubnet2RouteTableAssociation:
-    Type: AWS::EC2::SubnetRouteTableAssociation
-    Properties:
-      SubnetId: !Ref PublicSubnet2
-      RouteTableId: !Ref PublicRouteTable
-  # Security Groups
-  GradioSecurityGroup:
-    Type: AWS::EC2::SecurityGroup
-    Properties:
-      GroupDescription: Security group for Gradio service
-      VpcId: !Ref VPC
-      SecurityGroupIngress:
-        - IpProtocol: tcp
-          FromPort: 7860
-          ToPort: 7860
-          CidrIp: 0.0.0.0/0
-          Description: INTERNET HTTPS
-        - IpProtocol: tcp
-          FromPort: 80
-          ToPort: 80
-          CidrIp: 0.0.0.0/0
-          Description: INTERNET HTTP
-      SecurityGroupEgress:
-        - IpProtocol: -1
-          CidrIp: 0.0.0.0/0
-  FastAPISecurityGroup:
-    Type: AWS::EC2::SecurityGroup
-    Properties:
-      GroupDescription: Security group for FastAPI service
-      VpcId: !Ref VPC
-      SecurityGroupIngress:
-        - IpProtocol: tcp
-          FromPort: 8000
-          ToPort: 8000
-          CidrIp: 0.0.0.0/0
-          Description: INTERNET HTTPS
-        - IpProtocol: tcp
-          FromPort: 80
-          ToPort: 80
-          CidrIp: 0.0.0.0/0
-          Description: INTERNET HTTP
-      SecurityGroupEgress:
-        - IpProtocol: -1
-          CidrIp: 0.0.0.0/0
-  # IAM Roles and Policies
-  # Gradio Execution Role - for pulling images and logging
-  GradioTaskExecutionRole:
-    Type: AWS::IAM::Role
-    Properties:
-      AssumeRolePolicyDocument:
-        Version: '2012-10-17'
-        Statement:
-          - Effect: Allow
-            Principal:
-              Service: ecs-tasks.amazonaws.com
-            Action: sts:AssumeRole
-      ManagedPolicyArns:
-        - arn:aws:iam::aws:policy/service-role/AmazonECSTaskExecutionRolePolicy
-      Policies:
-        - PolicyName: GradioExecutionPolicy
-          PolicyDocument:
-            Version: '2012-10-17'
-            Statement:
-              - Effect: Allow
-                Action:
-                  - ecr:GetAuthorizationToken
-                  - ecr:BatchCheckLayerAvailability
-                  - ecr:GetDownloadUrlForLayer
-                  - ecr:BatchGetImage
-                Resource: '*'
-              - Effect: Allow
-                Action:
-                  - logs:CreateLogStream
-                  - logs:PutLogEvents
-                Resource:
-                  - !Sub arn:aws:logs:${AWS::Region}:${AWS::AccountId}:log-group:/ecs/${Environment}-acres-gradio:*
-                  - !Sub arn:aws:logs:${AWS::Region}:${AWS::AccountId}:log-group:/ecs/${Environment}-acres-gradio:log-stream:*
-  # Gradio Task Role - for runtime permissions
-  GradioTaskRole:
-    Type: AWS::IAM::Role
-    Properties:
-      AssumeRolePolicyDocument:
-        Version: '2012-10-17'
-        Statement:
-          - Effect: Allow
-            Principal:
-              Service: ecs-tasks.amazonaws.com
-            Action: sts:AssumeRole
-      Policies:
-        - PolicyName: GradioTaskPolicy
-          PolicyDocument:
-            Version: '2012-10-17'
-            Statement:
-              # Add specific permissions needed by your Gradio application at runtime
-              - Effect: Allow
-                Action:
-                  - s3:GetObject
-                  - s3:PutObject
-                Resource: !Sub arn:aws:s3:::${Environment}-acres-gradio-bucket/*
-  # FastAPI Execution Role - for pulling images and logging
-  FastAPITaskExecutionRole:
-    Type: AWS::IAM::Role
-    Properties:
-      AssumeRolePolicyDocument:
-        Version: '2012-10-17'
-        Statement:
-          - Effect: Allow
-            Principal:
-              Service: ecs-tasks.amazonaws.com
-            Action: sts:AssumeRole
-      ManagedPolicyArns:
-        - arn:aws:iam::aws:policy/service-role/AmazonECSTaskExecutionRolePolicy
-      Policies:
-        - PolicyName: FastAPIExecutionPolicy
-          PolicyDocument:
-            Version: '2012-10-17'
-            Statement:
-              - Effect: Allow
-                Action:
-                  - ecr:GetAuthorizationToken
-                  - ecr:BatchCheckLayerAvailability
-                  - ecr:GetDownloadUrlForLayer
-                  - ecr:BatchGetImage
-                Resource: '*'
-              - Effect: Allow
-                Action:
-                  - logs:CreateLogStream
-                  - logs:PutLogEvents
-                Resource:
-                  - !Sub arn:aws:logs:${AWS::Region}:${AWS::AccountId}:log-group:/ecs/${Environment}-acres-fastapi:*
-                  - !Sub arn:aws:logs:${AWS::Region}:${AWS::AccountId}:log-group:/ecs/${Environment}-acres-fastapi:log-stream:*
-  # FastAPI Task Role - for runtime permissions
-  FastAPITaskRole:
-    Type: AWS::IAM::Role
-    Properties:
-      AssumeRolePolicyDocument:
-        Version: '2012-10-17'
-        Statement:
-          - Effect: Allow
-            Principal:
-              Service: ecs-tasks.amazonaws.com
-            Action: sts:AssumeRole
-      Policies:
-        - PolicyName: FastAPITaskPolicy
-          PolicyDocument:
-            Version: '2012-10-17'
-            Statement:
-              # Add specific permissions needed by your FastAPI application at runtime
-              - Effect: Allow
-                Action:
-                  - dynamodb:GetItem
-                  - dynamodb:PutItem
-                  - dynamodb:Query
-                Resource: !Sub arn:aws:dynamodb:${AWS::Region}:${AWS::AccountId}:table/${Environment}-acres-fastapi-table
-              # Allow FastAPI to make HTTP calls to Gradio service
-              - Effect: Allow
-                Action:
-                  - execute-api:Invoke
-                Resource: !Sub arn:aws:execute-api:${AWS::Region}:${AWS::AccountId}:*
-  # ECS Cluster
-  ECSCluster:
-    Type: AWS::ECS::Cluster
-    Properties:
-      ClusterName: !Ref ECSClusterName
-      Tags:
-        - Key: Environment
-          Value: !Ref Environment
-  # Load Balancer for Gradio
-  GradioALB:
-    Type: AWS::ElasticLoadBalancingV2::LoadBalancer
-    Properties:
-      Name: !Sub ${Environment}-acres-gradio-alb
-      Scheme: internet-facing
-      LoadBalancerAttributes:
-        - Key: idle_timeout.timeout_seconds
-          Value: '60'
-      Subnets:
-        - !Ref PublicSubnet1
-        - !Ref PublicSubnet2
-      SecurityGroups:
-        - !Ref GradioSecurityGroup
-  GradioTargetGroup:
-    Type: AWS::ElasticLoadBalancingV2::TargetGroup
-    Properties:
-      HealthCheckEnabled: true
-      HealthCheckIntervalSeconds: 30
-      HealthCheckPath: /
-      HealthCheckPort: 7860
-      HealthCheckTimeoutSeconds: 20
-      HealthyThresholdCount: 2
-      Name: !Sub ${Environment}-acres-gradio-tg
-      Port: 7860
-      Protocol: HTTP
-      TargetType: ip
-      UnhealthyThresholdCount: 5
-      VpcId: !Ref VPC
-      TargetGroupAttributes:
-        - Key: deregistration_delay.timeout_seconds
-          Value: '30'
-  GradioHTTPSListener:
-    # https://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide/aws-resource-elasticloadbalancingv2-listener.html
-    Type: AWS::ElasticLoadBalancingV2::Listener
-    Properties:
-      DefaultActions:
-        - Type: forward
-          TargetGroupArn: !Ref GradioTargetGroup
-      LoadBalancerArn: !Ref GradioALB
-      # Certificates:
-      #   - CertificateArn: !Ref CertificateArn
-      Port: 7860
-      Protocol: HTTP
-  # GradioHTTPListener:
-  #   # https://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide/aws-resource-elasticloadbalancingv2-listener.html
-  #   Type: AWS::ElasticLoadBalancingV2::Listener
-  #   Properties:
-  #     Protocol: HTTP
-  #     Port: 80
-  #     LoadBalancerArn: !Ref GradioALB
-  #     DefaultActions:
-  #       - Type: redirect
-  #         RedirectConfig:
-  #           Protocol: "HTTPS"
-  #           Port: 7860
-  #           Host: "#{host}"
-  #           Path: "/#{path}"
-  #           Query: "#{query}"
-  #           StatusCode: "HTTP_301"
-  # Load Balancer for FastAPI
-  FastAPIALB:
-    Type: AWS::ElasticLoadBalancingV2::LoadBalancer
-    Properties:
-      Name: !Sub ${Environment}-acres-fastapi-alb
-      Scheme: internet-facing
-      LoadBalancerAttributes:
-        - Key: idle_timeout.timeout_seconds
-          Value: '60'
-      Subnets:
-        - !Ref PublicSubnet1
-        - !Ref PublicSubnet2
-      SecurityGroups:
-        - !Ref FastAPISecurityGroup
-  FastAPITargetGroup:
-    Type: AWS::ElasticLoadBalancingV2::TargetGroup
-    Properties:
-      HealthCheckEnabled: true
-      HealthCheckIntervalSeconds: 30
-      HealthCheckPath: /docs  # FastAPI's Swagger UI path
-      HealthCheckPort: 8000
-      HealthCheckTimeoutSeconds: 20
-      HealthyThresholdCount: 2
-      Name: !Sub ${Environment}-acres-fastapi-tg
-      Port: 8000
-      Protocol: HTTP
-      TargetType: ip
-      UnhealthyThresholdCount: 5
-      VpcId: !Ref VPC
-      TargetGroupAttributes:
-        - Key: deregistration_delay.timeout_seconds
-          Value: '30'
-  FastAPIHTTPSListener:
-    # https://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide/aws-resource-elasticloadbalancingv2-listener.html
-    Type: AWS::ElasticLoadBalancingV2::Listener
-    Properties:
-      DefaultActions:
-        - Type: forward
-          TargetGroupArn: !Ref FastAPITargetGroup
-      LoadBalancerArn: !Ref FastAPIALB
-      # Certificates:
-      #   - CertificateArn: !Ref CertificateArn
-      Port: 8000
-      Protocol: HTTP
-  # FastAPIHTTPListener:
-  #   # https://docs.aws.amazon.com/AWSCloudFormation/latest/UserGuide/aws-resource-elasticloadbalancingv2-listener.html
-  #   Type: AWS::ElasticLoadBalancingV2::Listener
-  #   Properties:
-  #     Protocol: HTTP
-  #     Port: 80
-  #     LoadBalancerArn: !Ref FastAPIALB
-  #     DefaultActions:
-  #       - Type: redirect
-  #         RedirectConfig:
-  #           Protocol: "HTTPS"
-  #           Port: 8000
-  #           Host: "#{host}"
-  #           Path: "/#{path}"
-  #           Query: "#{query}"
-  #           StatusCode: "HTTP_301"
-  # ECS Task Definitions
-  GradioTaskDefinition:
-    Type: AWS::ECS::TaskDefinition
-    Properties:
-      Family: !Sub ${Environment}-acres-gradio
-      RequiresCompatibilities:
-        - FARGATE
-      Cpu: !Ref GradioTaskDefinitionCPU
-      Memory: !Ref GradioTaskDefinitionMemory
-      NetworkMode: awsvpc
-      ExecutionRoleArn: !GetAtt GradioTaskExecutionRole.Arn
-      TaskRoleArn: !GetAtt GradioTaskRole.Arn
-      ContainerDefinitions:
-        - Name: gradio
-          Image: !Ref ContainerImageGradio
-          PortMappings:
-            - ContainerPort: 7860
-          LogConfiguration:
-            LogDriver: awslogs
-            Options:
-              awslogs-group: !Ref GradioLogGroup
-              awslogs-region: !Ref AWS::Region
-              awslogs-stream-prefix: gradio
-  FastAPITaskDefinition:
-    Type: AWS::ECS::TaskDefinition
-    Properties:
-      Family: !Sub ${Environment}-acres-fastapi
-      RequiresCompatibilities:
-        - FARGATE
-      Cpu: !Ref FastAPITaskDefinitionCPU
-      Memory: !Ref FastAPITaskDefinitionMemory
-      NetworkMode: awsvpc
-      ExecutionRoleArn: !GetAtt FastAPITaskExecutionRole.Arn
-      TaskRoleArn: !GetAtt FastAPITaskRole.Arn
-      ContainerDefinitions:
-        - Name: fastapi
-          Image: !Ref ContainerImageFastAPI
-          PortMappings:
-            - ContainerPort: 8000
-          Environment:
-            - Name: GRADIO_URL
-              Value: !Sub http://${GradioALB.DNSName}:7860/
-          LogConfiguration:
-            LogDriver: awslogs
-            Options:
-              awslogs-group: !Ref FastAPILogGroup
-              awslogs-region: !Ref AWS::Region
-              awslogs-stream-prefix: fastapi
-  # CloudWatch Log Groups
-  GradioLogGroup:
-    Type: AWS::Logs::LogGroup
-    Properties:
-      LogGroupName: !Sub /ecs/${Environment}-acres-gradio
-      RetentionInDays: 30
-  FastAPILogGroup:
-    Type: AWS::Logs::LogGroup
-    Properties:
-      LogGroupName: !Sub /ecs/${Environment}-acres-fastapi
-      RetentionInDays: 30
-  # ECS Services
-  GradioService:
-    Type: AWS::ECS::Service
-    DependsOn:
-      - GradioHTTPSListener
-      # - GradioHTTPListener
-    Properties:
-      ServiceName: !Sub ${Environment}-acres-gradio
-      Cluster: !Ref ECSCluster
-      TaskDefinition: !Ref GradioTaskDefinition
-      DesiredCount: 1
-      LaunchType: FARGATE
-      HealthCheckGracePeriodSeconds: 180
-      LoadBalancers:
-        - ContainerName: gradio
-          ContainerPort: 7860
-          TargetGroupArn: !Ref GradioTargetGroup
-      NetworkConfiguration:
-        AwsvpcConfiguration:
-          AssignPublicIp: ENABLED
-          SecurityGroups:
-            - !Ref GradioSecurityGroup
-          Subnets:
-            - !Ref PublicSubnet1
-            - !Ref PublicSubnet2
-      DeploymentConfiguration:
-        DeploymentCircuitBreaker:
-          Enable: true
-          Rollback: true
-        MaximumPercent: 200
-        MinimumHealthyPercent: 100
-  FastAPIService:
-    Type: AWS::ECS::Service
-    DependsOn:
-      - GradioService
-      - FastAPIHTTPSListener
-      # - FastAPIHTTPListener
-    Properties:
-      ServiceName: !Sub ${Environment}-acres-fastapi
-      Cluster: !Ref ECSCluster
-      TaskDefinition: !Ref FastAPITaskDefinition
-      DesiredCount: 1
-      LaunchType: FARGATE
-      HealthCheckGracePeriodSeconds: 180
-      LoadBalancers:
-        - ContainerName: fastapi
-          ContainerPort: 8000
-          TargetGroupArn: !Ref FastAPITargetGroup
-      NetworkConfiguration:
-        AwsvpcConfiguration:
-          AssignPublicIp: ENABLED
-          SecurityGroups:
-            - !Ref FastAPISecurityGroup
-          Subnets:
-            - !Ref PublicSubnet1
-            - !Ref PublicSubnet2
-      DeploymentConfiguration:
-        DeploymentCircuitBreaker:
-          Enable: true
-          Rollback: true
-        MaximumPercent: 200
-        MinimumHealthyPercent: 100
-      # Add deployment controller for better rollout control
-      DeploymentController:
-        Type: ECS
-Outputs:
-  VpcId:
-    Description: VPC ID
-    Value: !Ref VPC
-  PublicSubnet1:
-    Description: Public Subnet 1
-    Value: !Ref PublicSubnet1
-  PublicSubnet2:
-    Description: Public Subnet 2
-    Value: !Ref PublicSubnet2
-  GradioServiceUrl:
-    Description: URL for the Gradio service
-    Value: !Sub http://${GradioALB.DNSName}:7860/
-  ECSClusterName:
-    Description: Name of the ECS cluster
-    Value: !Ref ECSCluster
-  GradioServiceName:
-    Description: Name of the Gradio service
-    Value: !GetAtt GradioService.Name
-  FastAPIServiceName:
-    Description: Name of the FastAPI service
-    Value: !GetAtt FastAPIService.Name
-  FastAPIServiceUrl:
-    Description: URL for the FastAPI service
-    Value: !Sub http://${FastAPIALB.DNSName}:8000/

interface.py DELETED Viewed

@@ -1,47 +0,0 @@
-"""
-Gradio interface module for ACRES RAG Platform.
-Defines the UI components and layout.
-"""
-# interface.py
-import gradio as gr
-def create_chat_interface() -> gr.Blocks:
-    """Create the chat interface component."""
-    with gr.Blocks() as chat_interface:
-        with gr.Row():
-            with gr.Column(scale=7):
-                chat_history = gr.Chatbot(
-                    value=[], elem_id="chatbot", height=600, show_label=False
-                )
-            with gr.Column(scale=3):
-                pdf_preview = gr.Image(label="Source Page", height=600)
-        with gr.Row():
-            with gr.Column(scale=8):
-                query_input = gr.Textbox(
-                    show_label=False,
-                    placeholder="Ask a question about your documents...",
-                    container=False,
-                )
-            with gr.Column(scale=2):
-                submit_btn = gr.Button("Send", variant="primary")
-        with gr.Row():
-            pdf_files = gr.File(
-                file_count="multiple", file_types=[".pdf"], label="Upload PDF Files"
-            )
-            collection_name = gr.Textbox(
-                label="Collection Name", placeholder="Name this collection of PDFs..."
-            )
-    return (
-        chat_interface,
-        chat_history,
-        pdf_preview,
-        query_input,
-        submit_btn,
-        pdf_files,
-        collection_name,
-    )

pyproject.toml DELETED Viewed

@@ -1,19 +0,0 @@
-[tool.black]
-include = '\.pyi?$'
-exclude = '''
-/(
-    \.git
-  | \.hg
-  | \.mypy_cache
-  | \.tox
-  | \.venv
-  | env
-  |venv
-  | _build
-  | buck-out
-  | build
-  | dist
-  | migrations
-  |alembic
-)/
-'''

rag/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (159 Bytes). View file

rag/__pycache__/rag_pipeline.cpython-311.pyc ADDED Viewed

Binary file (5.58 kB). View file

rag/rag_pipeline.py CHANGED Viewed

@@ -1,202 +1,91 @@
-# rag/rag_pipeline.py
 import json
-import logging
-import os
-import re
-from typing import Any, Dict, List, Optional, Tuple
-import chromadb
-from dotenv import load_dotenv
-from llama_index.core import Document, PromptTemplate, VectorStoreIndex
-from llama_index.core.node_parser import SentenceSplitter, SentenceWindowNodeParser
 from llama_index.embeddings.openai import OpenAIEmbedding
 from llama_index.llms.openai import OpenAI
-from llama_index.vector_stores.chroma import ChromaVectorStore
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-load_dotenv()
 class RAGPipeline:
-    def __init__(
-        self,
-        study_json,
-        collection_name="study_files_rag_collection",
-        use_semantic_splitter=False,
-    ):
         self.study_json = study_json
-        self.collection_name = collection_name
         self.use_semantic_splitter = use_semantic_splitter
         self.documents = None
-        self.client = chromadb.Client()
-        self.collection = self.client.get_or_create_collection(self.collection_name)
-        self.embedding_model = OpenAIEmbedding(
-            model_name="text-embedding-ada-002", api_key=os.getenv("OPENAI_API_KEY")
-        )
-        self.is_pdf = self._check_if_pdf_collection()
         self.load_documents()
         self.build_index()
-    def _check_if_pdf_collection(self) -> bool:
-        """Check if this is a PDF collection based on the JSON structure."""
-        try:
-            with open(self.study_json, "r") as f:
-                data = json.load(f)
-                # Check first document for PDF-specific fields
-                if data and isinstance(data, list) and len(data) > 0:
-                    return "pages" in data[0] and "source_file" in data[0]
-            return False
-        except Exception as e:
-            logger.error(f"Error checking collection type: {str(e)}")
-            return False
-    def extract_page_number_from_query(self, query: str) -> int:
-        """Extract page number from query text."""
-        # Look for patterns like "page 3", "p3", "p. 3", etc.
-        patterns = [
-            r"page\s*(\d+)",
-            r"p\.\s*(\d+)",
-            r"p\s*(\d+)",
-            r"pg\.\s*(\d+)",
-            r"pg\s*(\d+)",
-        ]
-        for pattern in patterns:
-            match = re.search(pattern, query.lower())
-            if match:
-                return int(match.group(1))
-        return None
     def load_documents(self):
         if self.documents is None:
             with open(self.study_json, "r") as f:
                 self.data = json.load(f)
             self.documents = []
-            if self.is_pdf:
-                # Handle PDF documents
-                for index, doc_data in enumerate(self.data):
-                    pages = doc_data.get("pages", {})
-                    for page_num, page_content in pages.items():
-                        if isinstance(page_content, dict):
-                            content = page_content.get("text", "")
-                        else:
-                            content = page_content
-                        doc_content = (
-                            f"Title: {doc_data['title']}\n"
-                            f"Page {page_num} Content:\n{content}\n"
-                            f"Authors: {', '.join(doc_data['authors'])}\n"
-                        )
-                        metadata = {
-                            "title": doc_data.get("title"),
-                            "authors": ", ".join(doc_data.get("authors", [])),
-                            "year": doc_data.get("date"),
-                            "source_file": doc_data.get("source_file"),
-                            "page_number": int(page_num),
-                            "total_pages": doc_data.get("page_count"),
-                        }
-                        self.documents.append(
-                            Document(
-                                text=doc_content,
-                                id_=f"doc_{index}_page_{page_num}",
-                                metadata=metadata,
-                            )
-                        )
-            else:
-                # Handle Zotero documents
-                for index, doc_data in enumerate(self.data):
-                    doc_content = (
-                        f"Title: {doc_data.get('title', '')}\n"
-                        f"Abstract: {doc_data.get('abstract', '')}\n"
-                        f"Authors: {', '.join(doc_data.get('authors', []))}\n"
-                    )
-                    metadata = {
-                        "title": doc_data.get("title"),
-                        "authors": ", ".join(doc_data.get("authors", [])),
-                        "year": doc_data.get("date"),
-                        "doi": doc_data.get("doi"),
-                    }
-                    self.documents.append(
-                        Document(
-                            text=doc_content, id_=f"doc_{index}", metadata=metadata
-                        )
-                    )
     def build_index(self):
-        sentence_splitter = SentenceSplitter(chunk_size=2048, chunk_overlap=20)
-        def _split(text: str) -> List[str]:
-            return sentence_splitter.split_text(text)
-        node_parser = SentenceWindowNodeParser.from_defaults(
-            sentence_splitter=_split,
-            window_size=5,
-            window_metadata_key="window",
-            original_text_metadata_key="original_text",
-        )
-        # Parse documents into nodes for embedding
-        nodes = node_parser.get_nodes_from_documents(self.documents)
-        # Initialize ChromaVectorStore with the existing collection
-        vector_store = ChromaVectorStore(chroma_collection=self.collection)
-        # Create the VectorStoreIndex using the ChromaVectorStore
-        self.index = VectorStoreIndex(
-            nodes, vector_store=vector_store, embed_model=self.embedding_model
-        )
     def query(
         self, context: str, prompt_template: PromptTemplate = None
-    ) -> Tuple[str, List[Any]]:
         if prompt_template is None:
             prompt_template = PromptTemplate(
-            "Context information is below.\n"
-            "---------------------\n"
-            "{context_str}\n"
-            "---------------------\n"
-            "Given this information, please answer the question: {query_str}\n"
-            "Follow these guidelines for your response:\n"
-            "1. If the answer contains multiple pieces of information (e.g., author names, dates, statistics), "
-            "present it in a markdown table format.\n"
-            "2. For single piece information or simple answers, respond in a clear sentence.\n"
-            "3. Always cite sources using square brackets for EVERY piece of information, e.g. [1], [2], etc.\n"
-            "4. If the information spans multiple documents or pages, organize it by source.\n"
-            "5. If you're unsure about something, say so rather than making assumptions.\n"
-            "\nFormat tables like this:\n"
-            "| Field | Information | Source |\n"
-            "|-------|-------------|--------|\n"
-            "| Title | Example Title | [1] |\n"
-        )
-        # Extract page number for PDF documents
-        requested_page = (
-            self.extract_page_number_from_query(context) if self.is_pdf else None
-        )
         n_documents = len(self.index.docstore.docs)
-        print(f"n_documents: {n_documents}")
         query_engine = self.index.as_query_engine(
             text_qa_template=prompt_template,
-            similarity_top_k=n_documents if n_documents <= 17 else 15,
             response_mode="tree_summarize",
-            llm=OpenAI(model="gpt-4o-mini", api_key=os.getenv("OPENAI_API_KEY")),
         )
         response = query_engine.query(context)
-        # Debug logging
-        print(f"Response type: {type(response)}")
-        print(f"Has source_nodes: {hasattr(response, 'source_nodes')}")
-        if hasattr(response, 'source_nodes'):
-            print(f"Number of source nodes: {len(response.source_nodes)}")
-        return response.response, getattr(response, 'source_nodes', [])

 import json
+from typing import Dict, Any
+from llama_index.core import Document, VectorStoreIndex
+from llama_index.core.node_parser import SentenceWindowNodeParser, SentenceSplitter
+from llama_index.core import PromptTemplate
+from typing import List
 from llama_index.embeddings.openai import OpenAIEmbedding
 from llama_index.llms.openai import OpenAI
 class RAGPipeline:
+    def __init__(self, study_json, use_semantic_splitter=False):
         self.study_json = study_json
         self.use_semantic_splitter = use_semantic_splitter
         self.documents = None
+        self.index = None
         self.load_documents()
         self.build_index()
     def load_documents(self):
         if self.documents is None:
             with open(self.study_json, "r") as f:
                 self.data = json.load(f)
             self.documents = []
+            for index, doc_data in enumerate(self.data):
+                doc_content = (
+                    f"Title: {doc_data['title']}\n"
+                    f"Abstract: {doc_data['abstract']}\n"
+                    f"Authors: {', '.join(doc_data['authors'])}\n"
+                )
+                metadata = {
+                    "title": doc_data.get("title"),
+                    "authors": doc_data.get("authors", []),
+                    "year": doc_data.get("year"),
+                    "doi": doc_data.get("doi"),
+                }
+                self.documents.append(
+                    Document(text=doc_content, id_=f"doc_{index}", metadata=metadata)
+                )
     def build_index(self):
+        if self.index is None:
+            sentence_splitter = SentenceSplitter(chunk_size=2048, chunk_overlap=20)
+            def _split(text: str) -> List[str]:
+                return sentence_splitter.split_text(text)
+            node_parser = SentenceWindowNodeParser.from_defaults(
+                sentence_splitter=_split,
+                window_size=5,
+                window_metadata_key="window",
+                original_text_metadata_key="original_text",
+            )
+            nodes = node_parser.get_nodes_from_documents(self.documents)
+            self.index = VectorStoreIndex(
+                nodes, embed_model=OpenAIEmbedding(model_name="text-embedding-3-large")
+            )
     def query(
         self, context: str, prompt_template: PromptTemplate = None
+    ) -> Dict[str, Any]:
         if prompt_template is None:
             prompt_template = PromptTemplate(
+                "Context information is below.\n"
+                "---------------------\n"
+                "{context_str}\n"
+                "---------------------\n"
+                "Given this information, please answer the question provided in the context. "
+                "Include all relevant information from the provided context. "
+                "If information comes from multiple sources, please mention all of them. "
+                "If the information is not available in the context, please state that clearly. "
+                "When quoting specific information, please use square brackets to indicate the source, e.g. [1], [2], etc."
+            )
+        # This is a hack to index all the documents in the store :)
         n_documents = len(self.index.docstore.docs)
         query_engine = self.index.as_query_engine(
             text_qa_template=prompt_template,
+            similarity_top_k=n_documents,
             response_mode="tree_summarize",
+            llm=OpenAI(model="gpt-4o-mini"),
         )
         response = query_engine.query(context)
+        return response

rag/rag_pipeline_backup.py DELETED Viewed

@@ -1,93 +0,0 @@
-import json
-from typing import Any, Dict, List
-from llama_index.core import Document, PromptTemplate, VectorStoreIndex
-from llama_index.core.node_parser import SentenceSplitter, SentenceWindowNodeParser
-from llama_index.embeddings.openai import OpenAIEmbedding
-from llama_index.llms.openai import OpenAI
-class RAGPipeline:
-    def __init__(self, study_json, use_semantic_splitter=False):
-        self.study_json = study_json
-        self.use_semantic_splitter = use_semantic_splitter
-        self.documents = None
-        self.index = None
-        self.load_documents()
-        self.build_index()
-    def load_documents(self):
-        if self.documents is None:
-            with open(self.study_json, "r") as f:
-                self.data = json.load(f)
-            self.documents = []
-            for index, doc_data in enumerate(self.data):
-                doc_content = (
-                    f"Title: {doc_data['title']}\n"
-                    f"Abstract: {doc_data['abstract']}\n"
-                    f"Authors: {', '.join(doc_data['authors'])}\n"
-                    # f"full_text: {doc_data['full_text']}"
-                )
-                metadata = {
-                    "title": doc_data.get("title"),
-                    "authors": doc_data.get("authors", []),
-                    "year": doc_data.get("date"),
-                    "doi": doc_data.get("doi"),
-                }
-                self.documents.append(
-                    Document(text=doc_content, id_=f"doc_{index}", metadata=metadata)
-                )
-    def build_index(self):
-        if self.index is None:
-            sentence_splitter = SentenceSplitter(chunk_size=2048, chunk_overlap=20)
-            def _split(text: str) -> List[str]:
-                return sentence_splitter.split_text(text)
-            node_parser = SentenceWindowNodeParser.from_defaults(
-                sentence_splitter=_split,
-                window_size=5,
-                window_metadata_key="window",
-                original_text_metadata_key="original_text",
-            )
-            nodes = node_parser.get_nodes_from_documents(self.documents)
-            self.index = VectorStoreIndex(
-                nodes, embed_model=OpenAIEmbedding(model_name="text-embedding-3-large")
-            )
-    def query(
-        self, context: str, prompt_template: PromptTemplate = None
-    ) -> Dict[str, Any]:
-        if prompt_template is None:
-            prompt_template = PromptTemplate(
-                "Context information is below.\n"
-                "---------------------\n"
-                "{context_str}\n"
-                "---------------------\n"
-                "Given this information, please answer the question: {query_str}\n"
-                "Provide an answer to the question using evidence from the context above. "
-                "Cite sources using square brackets for EVERY piece of information, e.g. [1], [2], etc. "
-                "Even if there's only one source, still include the citation. "
-                "If you're unsure about a source, use [?]. "
-                "Ensure that EVERY statement from the context is properly cited."
-            )
-        # This is a hack to index all the documents in the store :)
-        n_documents = len(self.index.docstore.docs)
-        print(f"n_documents: {n_documents}")
-        query_engine = self.index.as_query_engine(
-            text_qa_template=prompt_template,
-            similarity_top_k=n_documents if n_documents <= 17 else 15,
-            response_mode="tree_summarize",
-            llm=OpenAI(model="gpt-4o-mini"),
-        )
-        response = query_engine.query(context)
-        return response

requirements-dev.txt DELETED Viewed

@@ -1,3 +0,0 @@
-black==24.10.0
-isort==5.13.2
-flake8==7.1.1

requirements.txt CHANGED Viewed

@@ -1,25 +1,6 @@
-# Core dependencies
-chromadb==0.5.20
-fastapi==0.115.5
-gradio==5.6.0
-gradio_client==1.4.3
-nest-asyncio==1.6.0
-openai==1.57.0
-pandas==2.2.3
-pydantic==2.9.2
-python-dotenv
-pyzotero
-python-slugify
-PyMuPDF==1.23.8
-Pillow==10.2.0
-sqlmodel==0.0.22
-cachetools
-# LlamaIndex ecosystem (pinned to compatible versions)
-llama-index-core
-docling
-llama-index-readers-docling
-llama-index-vector-stores-chroma
-llama-index-node-parser-docling
-llama-index-embeddings-openai
-llama-index-llms-openai-like

+fastapi==0.112.2
+gradio
+llama-index
+openai
+pandas
+pydantic

sample_queries.md DELETED Viewed

	@@ -1,2 +0,0 @@
1	- 1. For each of the studies on vaccine coverage, could you create a table that lists the findings from the vaccine coverage studies, incorporating variables such as STUDYID, TITLE, DOIs, YEAR?
2	-

study_files.json DELETED Viewed

@@ -1,13 +0,0 @@
-{
-    "Ebola Virus": "data/ebola-virus_zotero_items.json",
-    "GeneXpert": "data/genexpert_zotero_items.json",
-    "Vaccine coverage": "data/vaccine-coverage_zotero_items.json",
-    "Concept": "data/concept_zotero_items.json",
-    "Zotero Collection Pastan": "data/zotero-collection-pastan_zotero_items.json",
-    "pdf_thequickone": "data/thequickone_20250108_111913_documents.json",
-    "pdf_aforapples": "data/aforapples_20250108_113044_documents.json",
-    "pdf_bforbinance": "data/bforbinance_20250108_114459_documents.json",
-    "pdf_cforcongo": "data/cforcongo_20250108_115233_documents.json",
-    "pdf_hjhj": "data/hjhj_20250108_115714_documents.json",
-    "pdf_schooldropouts": "data/schooldropouts_20250108_140257_documents.json"
-}

utils/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (161 Bytes). View file

utils/__pycache__/prompts.cpython-311.pyc ADDED Viewed

Binary file (5.68 kB). View file

utils/db.py DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:e165937f30a52640195e2a6ee5a71bcf980f0037e901658ebf813d794332ca6c
-size 5045

utils/helpers.py CHANGED Viewed

@@ -1,247 +1,42 @@
-# utils/helpers.py
-import json
-import os
-from typing import Any, Dict, List
-import chromadb
-from chromadb.api.types import Document
 from llama_index.core import Response
-from rag.rag_pipeline import RAGPipeline
-from utils.prompts import (
-    StudyCharacteristics,
-    VaccineCoverageVariables,
-    structured_follow_up_prompt,
-)
-# Initialize ChromaDB client
-chromadb_client = chromadb.Client()
-def read_study_files(file_path):
-    """
-    Reads a JSON file and returns the parsed JSON data.
-    Args:
-        file_path (str): The path to the JSON file to be read.
-    Returns:
-        dict: The data from the JSON file as a Python dictionary.
-    Raises:
-        FileNotFoundError: If the file is not found at the provided path.
-        json.JSONDecodeError: If the file contents are not valid JSON.
-    Example:
-        Given a JSON file 'study_files.json' with content like:
-        {
-            "Vaccine Coverage": "data/vaccine_coverage_zotero_items.json",
-            "Ebola Virus": "data/ebola_virus_zotero_items.json",
-            "Gene Xpert": "data/gene_xpert_zotero_items.json"
-        }
-        Calling `read_json_file("study_files.json")` will return:
-        {
-            "Vaccine Coverage": "data/vaccine_coverage_zotero_items.json",
-            "Ebola Virus": "data/ebola_virus_zotero_items.json",
-            "Gene Xpert": "data/gene_xpert_zotero_items.json"
-        }
-    """
-    try:
-        with open(file_path, "r") as file:
-            data = json.load(file)
-        return data
-    except FileNotFoundError as e:
-        raise FileNotFoundError(f"The file at path {file_path} was not found.") from e
-    except json.JSONDecodeError as e:
-        raise ValueError(
-            f"The file at path {file_path} does not contain valid JSON."
-        ) from e
-def append_to_study_files(file_path, new_key, new_value):
-    """
-    Appends a new key-value entry to an existing JSON file.
-    Args:
-        file_path (str): The path to the JSON file.
-        new_key (str): The new key to add to the JSON file.
-        new_value (any): The value associated with the new key (can be any valid JSON data type).
-    Raises:
-        FileNotFoundError: If the file is not found at the provided path.
-        json.JSONDecodeError: If the file contents are not valid JSON.
-        IOError: If the file cannot be written.
-    Example:
-        If the file 'study_files.json' initially contains:
-        {
-            "Vaccine Coverage": "data/vaccine_coverage_zotero_items.json",
-            "Ebola Virus": "data/ebola_virus_zotero_items.json"
-        }
-        Calling `append_to_json_file("study_files.json", "Gene Xpert", "data/gene_xpert_zotero_items.json")`
-        will modify the file to:
-        {
-            "Vaccine Coverage": "data/vaccine_coverage_zotero_items.json",
-            "Ebola Virus": "data/ebola_virus_zotero_items.json",
-            "Gene Xpert": "data/gene_xpert_zotero_items.json"
-        }
-    """
-    try:
-        # Read the existing data from the file
-        with open(file_path, "r") as file:
-            data = json.load(file)
-        # Append the new key-value pair to the dictionary
-        data[new_key] = new_value
-        # Write the updated data back to the file
-        with open(file_path, "w") as file:
-            json.dump(data, file, indent=4)  # indent for pretty printing
-    except FileNotFoundError as e:
-        raise FileNotFoundError(f"The file at path {file_path} was not found.") from e
-    except json.JSONDecodeError as e:
-        raise ValueError(
-            f"The file at path {file_path} does not contain valid JSON."
-        ) from e
-    except IOError as e:
-        raise IOError(f"Failed to write to the file at {file_path}.") from e
-def generate_follow_up_questions(
-    rag: RAGPipeline, response: str, query: str, study_name: str
-) -> List[str]:
-    """
-    Generates follow-up questions based on the given RAGPipeline, response, query, and study_name.
-    Args:
-        rag (RAGPipeline): The RAGPipeline object used for generating follow-up questions.
-        response (str): The response to the initial query.
-        query (str): The initial query.
-        study_name (str): The name of the study.
-    Returns:
-        List[str]: A list of generated follow-up questions.
-    Raises:
-        None
-    """
-    # Determine the study type based on the study_name
-    if "Vaccine Coverage" in study_name:
-        study_type = "Vaccine Coverage"
-        key_variables = list(VaccineCoverageVariables.__annotations__.keys())
-    elif "Ebola Virus" in study_name:
-        study_type = "Ebola Virus"
-        key_variables = [
-            "SAMPLE_SIZE",
-            "PLASMA_TYPE",
-            "DOSAGE",
-            "FREQUENCY",
-            "SIDE_EFFECTS",
-            "VIRAL_LOAD_CHANGE",
-            "SURVIVAL_RATE",
-        ]
-    elif "Gene Xpert" in study_name:
-        study_type = "Gene Xpert"
-        key_variables = [
-            "OBJECTIVE",
-            "OUTCOME_MEASURES",
-            "SENSITIVITY",
-            "SPECIFICITY",
-            "COST_COMPARISON",
-            "TURNAROUND_TIME",
-        ]
     else:
-        study_type = "General"
-        key_variables = list(StudyCharacteristics.__annotations__.keys())
-    # Add key variables to the context
-    context = f"Study type: {study_type}\nKey variables to consider: {', '.join(key_variables)}\n\n{response}"
-    follow_up_response = rag.query(
-        structured_follow_up_prompt.format(
-            context_str=context,
-            query_str=query,
-            response_str=response,
-            study_type=study_type,
-        )
-    )
-    questions = follow_up_response.response.strip().split("\n")
-    cleaned_questions = []
-    for q in questions:
-        # Remove leading numbers and periods, and strip whitespace
-        cleaned_q = q.split(". ", 1)[-1].strip()
-        # Ensure the question ends with a question mark
-        if cleaned_q and not cleaned_q.endswith("?"):
-            cleaned_q += "?"
-        if cleaned_q:
-            cleaned_questions.append(f"✨ {cleaned_q}")
-    return cleaned_questions[:3]
-def add_study_files_to_chromadb(file_path: str, collection_name: str):
-    """
-    Reads the study files data from a JSON file and adds it to the specified ChromaDB collection.
-    :param file_path: Path to the JSON file containing study files data.
-    :param collection_name: Name of the ChromaDB collection to store the data.
-    """
-    # Load study files data from JSON file
-    try:
-        with open(file_path, "r") as f:
-            study_files_data = json.load(f)
-    except FileNotFoundError:
-        print(f"File '{file_path}' not found.")
-        return
-    if not study_files_data:
-        return
-    # Get or create the collection in ChromaDB
-    collection = chromadb_client.get_or_create_collection(collection_name)
-    # Prepare lists for ids, texts, and metadata to batch insert
-    ids = []
-    documents = []
-    metadatas = []
-    # Populate lists with data from the JSON file
-    for name, file_path in study_files_data.items():
-        ids.append(name)  # Document ID
-        documents.append("")  # Optional text, can be left empty if not used
-        metadatas.append({"file_path": file_path})  # Metadata with file path
-    # Add documents to the collection in batch
-    collection.add(ids=ids, documents=documents, metadatas=metadatas)
-    print("All study files have been successfully added to ChromaDB.")
-def create_directory(directory_path):
-    """
-    Create a directory.
-    Does not raise an error if the directory already exists.
-    Args:
-        directory_path (str): Path of the directory to create
-    Returns:
-        bool: True if directory was created or already exists, False if creation failed
-    """
-    try:
-        # Use exist_ok=True to prevent error if directory exists
-        os.makedirs(directory_path, exist_ok=True)
-        return True
-    except PermissionError:
-        print(f"Permission denied: Cannot create directory {directory_path}")
-        return False
-    except Exception as e:
-        print(f"An unexpected error occurred: {e}")
-        return False
-if __name__ == "__main__":
-    # Usage example
-    add_study_files_to_chromadb("study_files.json", "study_files_collection")

+from typing import Dict, Any
 from llama_index.core import Response
+def process_response(response: Response) -> Dict[str, Any]:
+    source_nodes = response.source_nodes
+    sources = {}
+    for i, node in enumerate(source_nodes, 1):
+        source = format_source(node.metadata)
+        if source not in sources.values():
+            sources[i] = source
+    markdown_text = response.response + "\n\n### Sources\n\n"
+    raw_text = response.response + "\n\nSources:\n"
+    for i, source in sources.items():
+        markdown_text += f"{i}. {source}\n"
+        raw_text += f"[{i}] {source}\n"
+    return {"markdown": markdown_text, "raw": raw_text, "sources": sources}
+def format_source(metadata: Dict[str, Any]) -> str:
+    authors = metadata.get("authors", "Unknown Author")
+    year = metadata.get("year", "n.d.")
+    title = metadata.get("title", "Untitled")
+    author_list = authors.split(",")
+    if len(author_list) > 2:
+        formatted_authors = f"{author_list[0].strip()} et al."
+    elif len(author_list) == 2:
+        formatted_authors = f"{author_list[0].strip()} and {author_list[1].strip()}"
     else:
+        formatted_authors = author_list[0].strip()
+    year = "n.d." if year is None or year == "None" else str(year)
+    max_title_length = 250
+    if len(title) > max_title_length:
+        title = title[:max_title_length] + "..."
+    return f"{formatted_authors} ({year}). {title}"

utils/pdf_processor.py DELETED Viewed

@@ -1,222 +0,0 @@
-# utils/pdf_processor.py
-"""
-PDF processing module for ACRES RAG Platform.
-Handles PDF file processing, text extraction, and page rendering.
-"""
-import datetime
-import json
-import logging
-import os
-import re
-from typing import Dict, List, Optional
-from llama_index.readers.docling import DoclingReader
-import fitz
-from PIL import Image
-from slugify import slugify
-logger = logging.getLogger(__name__)
-reader = DoclingReader()
-class PDFProcessor:
-    def __init__(self, upload_dir: str = "data/uploads"):
-        """Initialize PDFProcessor with upload directory."""
-        self.upload_dir = upload_dir
-        os.makedirs(upload_dir, exist_ok=True)
-        self.current_page = 0
-    def is_references_page(self, text: str) -> bool:
-        """
-        Check if the page appears to be a references/bibliography page.
-        """
-        # Common section headers for references
-        ref_headers = [
-            r"^references\s*$",
-            r"^bibliography\s*$",
-            r"^works cited\s*$",
-            r"^citations\s*$",
-            r"^cited literature\s*$",
-        ]
-        # Check first few lines of the page
-        first_lines = text.lower().split("\n")[:3]
-        first_block = " ".join(first_lines)
-        # Check for reference headers
-        for header in ref_headers:
-            if re.search(header, first_block, re.IGNORECASE):
-                return True
-        # Check for reference-like patterns (e.g., [1] Author, et al.)
-        ref_patterns = [
-            r"^\[\d+\]",  # [1] style
-            r"^\d+\.",  # 1. style
-            r"^[A-Z][a-z]+,\s+[A-Z]\.",  # Author, I. style
-        ]
-        ref_pattern_count = 0
-        lines = text.split("\n")[:10]  # Check first 10 lines
-        for line in lines:
-            line = line.strip()
-            if any(re.match(pattern, line) for pattern in ref_patterns):
-                ref_pattern_count += 1
-        # If multiple reference-like patterns are found, likely a references page
-        return ref_pattern_count >= 3
-    def detect_references_start(self, doc: fitz.Document) -> Optional[int]:
-        """
-        Detect the page where references section starts.
-        Returns the page number or None if not found.
-        """
-        for page_num in range(len(doc)):
-            page = doc[page_num]
-            text = page.get_text()
-            if self.is_references_page(text):
-                logger.info(f"Detected references section starting at page {page_num}")
-                return page_num
-        return None
-    def process_pdfs(self, file_paths: List[str], collection_name: str) -> str:
-        """Process multiple PDF files and store their content."""
-        processed_docs = []
-        for file_path in file_paths:
-            try:
-                doc_data = self.extract_text_from_pdf(file_path)
-                processed_docs.append(doc_data)
-                logger.info(
-                    f"Successfully processed {file_path} ({doc_data['content_pages']} content pages)"
-                )
-            except Exception as e:
-                logger.error(f"Error processing {file_path}: {str(e)}")
-                continue
-        if not processed_docs:
-            raise ValueError("No documents were successfully processed")
-        # Save to JSON file
-        timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S")
-        output_filename = f"{slugify(collection_name)}_{timestamp}_documents.json"
-        output_path = os.path.join("data", output_filename)
-        # Ensure the data directory exists
-        os.makedirs("data", exist_ok=True)
-        with open(output_path, "w", encoding="utf-8") as f:
-            json.dump(processed_docs, f, indent=2, ensure_ascii=False)
-        logger.info(f"Saved processed documents to {output_path}")
-        return output_path
-    def extract_text_from_pdf(self, file_path: str) -> Dict:
-        """
-        Extract text and metadata from a PDF file using DoclingReader.
-        Maintains accurate page numbers for source citation.
-        """
-        try:
-            # Use DoclingReader for main content extraction
-            reader = DoclingReader()
-            documents = reader.load_data(file_path)
-            text = documents[0].text if documents else ""
-            # Use PyMuPDF to get accurate page count
-            doc = fitz.open(file_path)
-            total_pages = len(doc)
-            # Extract title from document
-            title = os.path.basename(file_path)
-            title_match = re.search(r'#+ (.+?)\n', text)
-            if title_match:
-                title = title_match.group(1).strip()
-            # Extract abstract
-            abstract = ""
-            abstract_match = re.search(r'Abstract:?(.*?)(?=\n\n|Keywords:|$)', text, re.DOTALL | re.IGNORECASE)
-            if abstract_match:
-                abstract = abstract_match.group(1).strip()
-            # Extract authors
-            authors = []
-            author_section = re.search(r'\n(.*?)\n.*?Department', text)
-            if author_section:
-                author_text = author_section.group(1)
-                authors = [a.strip() for a in author_text.split(',') if a.strip()]
-            # Remove references section
-            content = text
-            ref_patterns = [r'\nReferences\n', r'\nBibliography\n', r'\nWorks Cited\n']
-            for pattern in ref_patterns:
-                split_text = re.split(pattern, content, flags=re.IGNORECASE)
-                if len(split_text) > 1:
-                    content = split_text[0]
-                    break
-            # Map content to pages using PyMuPDF for accurate page numbers
-            pages = {}
-            for page_num in range(total_pages):
-                page = doc[page_num]
-                page_text = page.get_text()
-                # Skip if this appears to be a references page
-                if self.is_references_page(page_text):
-                    logger.info(f"Skipping references page {page_num}")
-                    continue
-                # Look for this page's content in the Docling-extracted text
-                # This is a heuristic approach - we look for unique phrases from the page
-                key_phrases = self._get_key_phrases(page_text)
-                page_content = self._find_matching_content(content, key_phrases)
-                if page_content:
-                    pages[str(page_num)] = {
-                        'text': page_content,
-                        'page_number': page_num + 1  # 1-based page numbers for human readability
-                    }
-            # Create structured document with page-aware content
-            document = {
-                "title": title,
-                "authors": authors,
-                "date": "",  # Could be extracted if needed
-                "abstract": abstract,
-                "full_text": content,
-                "source_file": file_path,
-                "pages": pages,
-                "page_count": total_pages,
-                "content_pages": len(pages)  # Number of non-reference pages
-            }
-            doc.close()
-            return document
-        except Exception as e:
-            logger.error(f"Error processing PDF {file_path}: {str(e)}")
-            raise
-    def _get_key_phrases(self, text: str, phrase_length: int = 10) -> List[str]:
-        """Extract key phrases from text for matching."""
-        words = text.split()
-        phrases = []
-        for i in range(0, len(words), phrase_length):
-            phrase = ' '.join(words[i:i + phrase_length])
-            if len(phrase.strip()) > 20:  # Only use substantial phrases
-                phrases.append(phrase)
-        return phrases
-    def _find_matching_content(self, docling_text: str, key_phrases: List[str]) -> Optional[str]:
-        """Find the corresponding content in Docling text using key phrases."""
-        for phrase in key_phrases:
-            if phrase in docling_text:
-                # Find the paragraph or section containing this phrase
-                paragraphs = docling_text.split('\n\n')
-                for para in paragraphs:
-                    if phrase in para:
-                        return para
-        return None

utils/prompts.py CHANGED Viewed

@@ -1,10 +1,7 @@
-# utils/prompts.py
-from typing import List, Optional
 from llama_index.core import PromptTemplate
-from llama_index.core.prompts import PromptTemplate
 from pydantic import BaseModel, Field
 class StudyCharacteristics(BaseModel):
@@ -74,8 +71,18 @@ vaccine_coverage_prompt = PromptTemplate(
 )
 sample_questions = {
-    "Vaccine coverage": [
         "What are the vaccine coverage rates reported in the study?",
         "Are there any reported adverse events following immunization (AEFI)?",
         "How does the study account for different vaccine types or schedules?",
         "Extract and present in a tabular format the following variables for each vaccine coverage study: STUDYID, AUTHOR, YEAR, TITLE, PUBLICATION_TYPE, STUDY_DESIGN, STUDY_AREA_REGION, STUDY_POPULATION, IMMUNISABLE_DISEASE_UNDER_STUDY, ROUTE_OF_VACCINE_ADMINISTRATION, DURATION_OF_STUDY, DURATION_IN_RELATION_TO_COVID19, VACCINE_COVERAGE_RATES, PROPORTION_ADMINISTERED_WITHIN_RECOMMENDED_AGE, IMMUNISATION_UPTAKE, VACCINE_DROP_OUT_RATES, INTENTIONS_TO_VACCINATE, VACCINE_CONFIDENCE, HESITANCY_FACTORS, DEMOGRAPHIC_DIFFERENCES, INTERVENTIONS, EQUITY_CONSIDERATIONS, GEOGRAPHICAL_SCOPE, AEFI, VACCINE_TYPES, and STUDY_COMMENTS.",
@@ -83,21 +90,37 @@ sample_questions = {
     "Ebola Virus": [
         "What is the sample size of the study?",
         "What is the type of plasma used in the study?",
         "What biosafety measures were implemented during the study?",
         "Were there any ethical considerations or challenges reported?",
         "Create a structured table for each Ebola virus study, including the following information: STUDYID, AUTHOR, YEAR, TITLE, PUBLICATION_TYPE, STUDY_DESIGN, STUDY_AREA_REGION, STUDY_POPULATION, SAMPLE_SIZE, PLASMA_TYPE, DOSAGE, FREQUENCY, SIDE_EFFECTS, VIRAL_LOAD_CHANGE, SURVIVAL_RATE, INCLUSION_CRITERIA, EXCLUSION_CRITERIA, SUBGROUP_ANALYSES, FOLLOW_UP_DURATION, LONG_TERM_OUTCOMES, DISEASE_SEVERITY_ASSESSMENT, BIOSAFETY_MEASURES, ETHICAL_CONSIDERATIONS, and STUDY_COMMENTS.",
     ],
-    "GeneXpert": [
         "What is the main objective of the study?",
         "What is the study design?",
         "What disease condition is being studied?",
         "Extract and present in a tabular format the following variables for each Gene Xpert study: STUDYID, AUTHOR, YEAR, TITLE, PUBLICATION_TYPE, STUDY_DESIGN, STUDY_AREA_REGION, STUDY_POPULATION, DISEASE_CONDITION, OBJECTIVE, OUTCOME_MEASURES, SENSITIVITY, SPECIFICITY, COST_COMPARISON, TURNAROUND_TIME, IMPLEMENTATION_CHALLENGES, PERFORMANCE_VARIATIONS, QUALITY_CONTROL, EQUIPMENT_ISSUES, PATIENT_OUTCOME_IMPACT, TRAINING_REQUIREMENTS, SCALABILITY_CONSIDERATIONS, and STUDY_COMMENTS.",
     ],
-    "General": [
-        "What is the main objective of the study?",
-        "What is the study design?",
-        "Extract and present in a tabular format the following variables for each study: STUDYID, AUTHOR, YEAR, TITLE, PUBLICATION_TYPE, STUDY_DESIGN, STUDY_AREA_REGION, STUDY_POPULATION, OBJECTIVE, and STUDY_COMMENTS.",
-    ],
 }
@@ -119,25 +142,5 @@ evidence_based_prompt = PromptTemplate(
     "---------------------\n"
     "Given this information, please answer the question: {query_str}\n"
     "Provide an answer to the question using evidence from the context above. "
-    "Cite sources using square brackets for EVERY piece of information, e.g. [1], [2], etc. "
-    "Even if there's only one source, still include the citation. "
-    "If you're unsure about a source, use [?]. "
-    "Ensure that EVERY statement from the context is properly cited."
-)
-structured_follow_up_prompt = PromptTemplate(
-    "Context information is below.\n"
-    "---------------------\n"
-    "{context_str}\n"
-    "---------------------\n"
-    "Original question: {query_str}\n"
-    "Response: {response_str}\n"
-    "Study type: {study_type}\n"
-    "Based on the above information and the study type, generate 3 follow-up questions that help extract key variables or information from the study. "
-    "Focus on the following aspects:\n"
-    "1. Any missing key variables that are typically reported in this type of study.\n"
-    "2. Clarification on methodology or results that might affect the interpretation of the study.\n"
-    "3. Potential implications or applications of the study findings.\n"
-    "Ensure each question is specific, relevant to the study type, and ends with a question mark."
 )

 from llama_index.core import PromptTemplate
+from typing import Optional, List
 from pydantic import BaseModel, Field
+from llama_index.core.prompts import PromptTemplate
 class StudyCharacteristics(BaseModel):
 )
 sample_questions = {
+    "Vaccine Coverage": [
         "What are the vaccine coverage rates reported in the study?",
+        "What proportion of vaccines were administered within the recommended age range?",
+        "What is the immunisation uptake reported in the study?",
+        "What are the vaccine drop-out rates mentioned in the document?",
+        "What are the intentions to vaccinate reported in the study?",
+        "How is vaccine confidence described in the document?",
+        "What factors influencing vaccine hesitancy are identified in the study?",
+        "Are there any demographic differences in vaccine coverage or uptake?",
+        "What interventions, if any, were implemented to improve vaccine coverage?",
+        "How does the study address equity in vaccine distribution and access?",
+        "What is the geographical scope of the study (e.g., urban, rural, national)?",
         "Are there any reported adverse events following immunization (AEFI)?",
         "How does the study account for different vaccine types or schedules?",
         "Extract and present in a tabular format the following variables for each vaccine coverage study: STUDYID, AUTHOR, YEAR, TITLE, PUBLICATION_TYPE, STUDY_DESIGN, STUDY_AREA_REGION, STUDY_POPULATION, IMMUNISABLE_DISEASE_UNDER_STUDY, ROUTE_OF_VACCINE_ADMINISTRATION, DURATION_OF_STUDY, DURATION_IN_RELATION_TO_COVID19, VACCINE_COVERAGE_RATES, PROPORTION_ADMINISTERED_WITHIN_RECOMMENDED_AGE, IMMUNISATION_UPTAKE, VACCINE_DROP_OUT_RATES, INTENTIONS_TO_VACCINATE, VACCINE_CONFIDENCE, HESITANCY_FACTORS, DEMOGRAPHIC_DIFFERENCES, INTERVENTIONS, EQUITY_CONSIDERATIONS, GEOGRAPHICAL_SCOPE, AEFI, VACCINE_TYPES, and STUDY_COMMENTS.",
     "Ebola Virus": [
         "What is the sample size of the study?",
         "What is the type of plasma used in the study?",
+        "What is the dosage and frequency of administration of the plasma?",
+        "Are there any reported side effects?",
+        "What is the change in viral load after treatment?",
+        "How many survivors were there in the intervention group compared to the control group?",
+        "What was the study design (e.g., RCT, observational)?",
+        "What were the inclusion and exclusion criteria for participants?",
+        "Were there any subgroup analyses performed?",
+        "What was the duration of follow-up?",
+        "Were there any reported long-term outcomes or sequelae?",
+        "How was the severity of Ebola virus disease assessed?",
         "What biosafety measures were implemented during the study?",
         "Were there any ethical considerations or challenges reported?",
         "Create a structured table for each Ebola virus study, including the following information: STUDYID, AUTHOR, YEAR, TITLE, PUBLICATION_TYPE, STUDY_DESIGN, STUDY_AREA_REGION, STUDY_POPULATION, SAMPLE_SIZE, PLASMA_TYPE, DOSAGE, FREQUENCY, SIDE_EFFECTS, VIRAL_LOAD_CHANGE, SURVIVAL_RATE, INCLUSION_CRITERIA, EXCLUSION_CRITERIA, SUBGROUP_ANALYSES, FOLLOW_UP_DURATION, LONG_TERM_OUTCOMES, DISEASE_SEVERITY_ASSESSMENT, BIOSAFETY_MEASURES, ETHICAL_CONSIDERATIONS, and STUDY_COMMENTS.",
     ],
+    "Gene Xpert": [
         "What is the main objective of the study?",
         "What is the study design?",
         "What disease condition is being studied?",
+        "What are the main outcome measures in the study?",
+        "What is the sensitivity and specificity of the Gene Xpert test?",
+        "How does the cost of the Gene Xpert testing strategy compare to other methods?",
+        "What is the turnaround time for Gene Xpert results compared to conventional methods?",
+        "Are there any reported challenges in implementing Gene Xpert in the study setting?",
+        "How does Gene Xpert performance vary across different sample types or patient populations?",
+        "What quality control measures were implemented in the study?",
+        "Were there any reported equipment failures or technical issues?",
+        "How does the study address the impact of Gene Xpert on patient outcomes or clinical decision-making?",
+        "What training or human resource requirements were reported for Gene Xpert implementation?",
+        "How does the study consider the scalability and sustainability of Gene Xpert use?",
         "Extract and present in a tabular format the following variables for each Gene Xpert study: STUDYID, AUTHOR, YEAR, TITLE, PUBLICATION_TYPE, STUDY_DESIGN, STUDY_AREA_REGION, STUDY_POPULATION, DISEASE_CONDITION, OBJECTIVE, OUTCOME_MEASURES, SENSITIVITY, SPECIFICITY, COST_COMPARISON, TURNAROUND_TIME, IMPLEMENTATION_CHALLENGES, PERFORMANCE_VARIATIONS, QUALITY_CONTROL, EQUIPMENT_ISSUES, PATIENT_OUTCOME_IMPACT, TRAINING_REQUIREMENTS, SCALABILITY_CONSIDERATIONS, and STUDY_COMMENTS.",
     ],
 }
     "---------------------\n"
     "Given this information, please answer the question: {query_str}\n"
     "Provide an answer to the question using evidence from the context above. "
+    "Cite sources using square brackets."
 )