Spaces:

matthoffner
/

serp-chat

Paused

App Files Files Community

matt HOFFNER committed on Jun 22, 2023

Commit

054d282

1 Parent(s): 25cad06

revamp

Browse files

Files changed (40) hide show

.gitignore +2 -0
Dockerfile +54 -16
README.md +45 -7
app.py +0 -98
index/docstore.json +0 -1
index/index_store.json +0 -1
index/vector_store.json +0 -1
jsconfig.json +8 -0
llm.py +0 -276
next.config.js +11 -0
overwrites.py +0 -12
package-lock.json +0 -0
package.json +26 -0
postcss.config.js +6 -0
presets.py +0 -29
public/favicon.svg +1 -0
public/spinner.svg +6 -0
requirements.txt +0 -10
src/app/globals.css +17 -0
src/app/head.jsx +10 -0
src/app/layout.jsx +19 -0
src/app/page.jsx +24 -0
src/app/search/error.jsx +15 -0
src/app/search/image/loading.jsx +23 -0
src/app/search/image/page.jsx +36 -0
src/app/search/layout.jsx +12 -0
src/app/search/web/loading.jsx +24 -0
src/app/search/web/page.jsx +36 -0
src/components/CountryLookup.jsx +15 -0
src/components/Footer.jsx +9 -0
src/components/HomeHeader.jsx +10 -0
src/components/HomeSearch.jsx +62 -0
src/components/ImageSearchResults.jsx +37 -0
src/components/PaginationButtons.jsx +37 -0
src/components/SearchBox.jsx +42 -0
src/components/SearchHeader.jsx +33 -0
src/components/SearchHeaderOptions.jsx +25 -0
src/components/WebSearchResults.jsx +31 -0
tailwind.config.js +15 -0
utils.py +0 -57

.gitignore ADDED Viewed

	@@ -0,0 +1,2 @@


1	+ node_modules/
2	+ .next/

Dockerfile CHANGED Viewed

@@ -1,24 +1,62 @@
-FROM nvidia/cuda:11.6.0-base-ubuntu20.04
 WORKDIR /app
-RUN export PATH="/usr/local/cuda/bin:$PATH"
-RUN apt update && \
-    apt install --no-install-recommends -y build-essential python3 python3-pip wget && \
-    apt clean && rm -rf /var/lib/apt/lists/*
-RUN wget -qO- "https://cmake.org/files/v3.17/cmake-3.17.0-Linux-x86_64.tar.gz" | tar --strip-components=1 -xz -C /usr/local
-RUN CMAKE_ARGS="-DLLAMA_CUBLAS=on" FORCE_CMAKE=1 pip install llama-cpp-python --no-cache-dir
-COPY requirements.txt ./
-RUN pip install --upgrade pip && \
-    pip install -r requirements.txt
-EXPOSE 7860
-RUN useradd -m -u 1000 user
-USER user
-COPY --chown=user . $HOME/app
-RUN ls -al
-CMD ["python3", "app.py", "--host", "127.0.0.1", "--port", "7860"]

+FROM node:18 AS base
+# Install dependencies only when needed
+FROM base AS deps
+WORKDIR /app
+# Install dependencies based on the preferred package manager
+COPY package.json yarn.lock* package-lock.json* pnpm-lock.yaml* ./
+RUN \
+  if [ -f yarn.lock ]; then yarn --frozen-lockfile; \
+  elif [ -f package-lock.json ]; then npm ci; \
+  elif [ -f pnpm-lock.yaml ]; then yarn global add pnpm && pnpm i --frozen-lockfile; \
+  else echo "Lockfile not found." && exit 1; \
+  fi
+# Uncomment the following lines if you want to use a secret at buildtime,
+# for example to access your private npm packages
+# RUN --mount=type=secret,id=HF_EXAMPLE_SECRET,mode=0444,required=true \
+#     $(cat /run/secrets/HF_EXAMPLE_SECRET)
+# Rebuild the source code only when needed
+FROM base AS builder
 WORKDIR /app
+COPY --from=deps /app/node_modules ./node_modules
+COPY . .
+# Next.js collects completely anonymous telemetry data about general usage.
+# Learn more here: https://nextjs.org/telemetry
+# Uncomment the following line in case you want to disable telemetry during the build.
+# ENV NEXT_TELEMETRY_DISABLED 1
+# RUN yarn build
+# If you use yarn, comment out this line and use the line above
+RUN npm run build
+# Production image, copy all the files and run next
+FROM base AS runner
+WORKDIR /app
+ENV NODE_ENV production
+# Uncomment the following line in case you want to disable telemetry during runtime.
+# ENV NEXT_TELEMETRY_DISABLED 1
+RUN addgroup --system --gid 1001 nodejs
+RUN adduser --system --uid 1001 nextjs
+COPY --from=builder /app/public ./public
+# Automatically leverage output traces to reduce image size
+# https://nextjs.org/docs/advanced-features/output-file-tracing
+COPY --from=builder --chown=nextjs:nodejs /app/.next/standalone ./
+COPY --from=builder --chown=nextjs:nodejs /app/.next/static ./.next/static
+USER nextjs
+EXPOSE 3000
+ENV PORT 3000
+CMD ["node", "server.js"]

README.md CHANGED Viewed

@@ -1,12 +1,50 @@
 ---
-title: serp-chat
-emoji: 📚🎳
-colorFrom: red
-colorTo: green
 sdk: docker
-app_file: app.py
-port: 7860
 pinned: false
 ---
-# llamacpp-cuda-doc-chat

 ---
+title: new google
+emoji: 📚
+colorFrom: yellow
+colorTo: indigo
 sdk: docker
+app_port: 3000
 pinned: false
 ---
+This is a fork of https://github.com/sahandghavidel/google-clone-nextjs13
+This is a [Next.js](https://nextjs.org/) project bootstrapped with [`create-next-app`](https://github.com/vercel/next.js/tree/canary/packages/create-next-app).
+## Getting Started
+First, run the development server:
+```bash
+npm run dev
+# or
+yarn dev
+# or
+pnpm dev
+```
+Open [http://localhost:3000](http://localhost:3000) with your browser to see the result.
+You can start editing the page by modifying `src/app/page.jsx`. The page auto-updates as you edit the file.
+[API routes](https://nextjs.org/docs/api-routes/introduction) can be accessed on [http://localhost:3000/api/hello](http://localhost:3000/api/hello). This endpoint can be edited in `pages/api/hello.js`.
+The `pages/api` directory is mapped to `/api/*`. Files in this directory are treated as [API routes](https://nextjs.org/docs/api-routes/introduction) instead of React pages.
+This project uses [`next/font`](https://nextjs.org/docs/basic-features/font-optimization) to automatically optimize and load Inter, a custom Google Font.
+## Learn More
+To learn more about Next.js, take a look at the following resources:
+- [Next.js Documentation](https://nextjs.org/docs) - learn about Next.js features and API.
+- [Learn Next.js](https://nextjs.org/learn) - an interactive Next.js tutorial.
+You can check out [the Next.js GitHub repository](https://github.com/vercel/next.js/) - your feedback and contributions are welcome!
+## Deploy on Vercel
+The easiest way to deploy your Next.js app is to use the [Vercel Platform](https://vercel.com/new?utm_medium=default-template&filter=next.js&utm_source=create-next-app&utm_campaign=create-next-app-readme) from the creators of Next.js.
+Check out our [Next.js deployment documentation](https://nextjs.org/docs/deployment) for more details.

app.py DELETED Viewed

@@ -1,98 +0,0 @@
-# -*- coding: utf-8 -*-
-import sys
-import gradio as gr
-from llm import *
-from utils import *
-from presets import *
-from overwrites import *
-logging.basicConfig(stream=sys.stdout, level=logging.INFO)
-logging.getLogger().addHandler(logging.StreamHandler(stream=sys.stdout))
-PromptHelper.compact_text_chunks = compact_text_chunks
-with gr.Blocks() as demo:
-    with gr.Box():
-        gr.Markdown("<h1 style='font-size: 48px; text-align: center;'>🪄 WizardLM Doc Chat 📓</h1>")
-    chat_context = gr.State([])
-    new_google_chat_context = gr.State([])
-    with gr.Row():
-        with gr.Column(scale=3):
-            with gr.Box():
-                gr.Markdown("**Indicies**")
-                with gr.Row():
-                    with gr.Column(scale=12):
-                        index_select = gr.Dropdown(choices=refresh_json_list(plain=True), value="index", show_label=False, multiselect=False).style(container=False)
-                    with gr.Column(min_width=30, scale=1):
-                        index_refresh_btn = gr.Button("🔄").style()
-    with gr.Tab("Search"):
-        with gr.Row():
-            with gr.Column(scale=1):
-                chat_tone = gr.Radio(["smart", "concise", "creative"], label="chat_tone", type="index", value="concise")
-            with gr.Column(scale=3):
-                search_options_checkbox = gr.CheckboxGroup(label="Todo: APIs", choices=["📚 Google", "🏡 Porch", "Your API Here"])
-        chatbot = gr.Chatbot()
-        with gr.Row():
-            with gr.Column(min_width=50, scale=1):
-                chat_empty_btn = gr.Button("🧹", variant="secondary")
-            with gr.Column(scale=12):
-                chat_input = gr.Textbox(show_label=False, placeholder="Enter text...").style(container=False)
-            with gr.Column(min_width=50, scale=1):
-                chat_submit_btn = gr.Button("🚀", variant="primary")
-    with gr.Tab("Setting"):
-        with gr.Row():
-            sim_k = gr.Slider(1, 10, 3, step=1, label="similarity_topk", interactive=True, show_label=True)
-            tempurature = gr.Slider(0, 2, 0.5, step=0.1, label="tempurature", interactive=True, show_label=True)
-        with gr.Row():
-            with gr.Column():
-                tmpl_select = gr.Radio(list(prompt_tmpl_dict.keys()), value="Default", label="Prompt", interactive=True)
-                prompt_tmpl = gr.Textbox(value=prompt_tmpl_dict["Default"] ,lines=10, max_lines=40 ,show_label=False)
-            with gr.Column():
-                refine_select = gr.Radio(list(refine_tmpl_dict.keys()), value="Default", label="Refine", interactive=True)
-                refine_tmpl = gr.Textbox(value=refine_tmpl_dict["Default"] ,lines=10, max_lines=40 ,show_label=False)
-    with gr.Tab("Upload"):
-        with gr.Row():
-            with gr.Column():
-                index_type = gr.Dropdown(choices=["GPTVectorStoreIndex"], label="index_type", value="GPTVectorStoreIndex")
-                upload_file = gr.Files(label="upload_file .txt, .pdf, .epub")
-                new_index_name = gr.Textbox(placeholder="new_index_name: ", show_label=False).style(container=False)
-                construct_btn = gr.Button("⚒️ Index", variant="primary")
-            with gr.Row():
-                with gr.Column():
-                    with gr.Row():
-                        max_input_size = gr.Slider(256, 4096, 4096, step=1, label="max_input_size", interactive=True, show_label=True)
-                        num_outputs = gr.Slider(256, 4096, 512, step=1, label="num_outputs", interactive=True, show_label=True)
-                    with gr.Row():
-                        max_chunk_overlap = gr.Slider(0, 100, 20, step=1, label="max_chunk_overlap", interactive=True, show_label=True)
-                        chunk_size_limit = gr.Slider(0, 4096, 0, step=1, label="chunk_size_limit", interactive=True, show_label=True)
-                    with gr.Row():
-                        embedding_limit = gr.Slider(0, 100, 0, step=1, label="embedding_limit", interactive=True, show_label=True)
-                        separator = gr.Textbox(show_label=False, label="separator", placeholder=",", value="", interactive=True)
-                    with gr.Row():
-                        num_children = gr.Slider(2, 100, 10, step=1, label="num_children", interactive=False, show_label=True)
-                        max_keywords_per_chunk = gr.Slider(1, 100, 10, step=1, label="max_keywords_per_chunk", interactive=False, show_label=True)
-    chat_input.submit(chat_ai, [index_select, chat_input, prompt_tmpl, refine_tmpl, sim_k, chat_tone, chat_context, chatbot, search_options_checkbox], [chat_context, chatbot])
-    chat_input.submit(reset_textbox, [], [chat_input])
-    chat_submit_btn.click(chat_ai, [index_select, chat_input, prompt_tmpl, refine_tmpl, sim_k, chat_tone, chat_context, chatbot, search_options_checkbox], [chat_context, chatbot])
-    chat_submit_btn.click(reset_textbox, [], [chat_input])
-    chat_empty_btn.click(lambda: ([], []), None, [chat_context, chatbot])
-    tmpl_select.change(change_prompt_tmpl, [tmpl_select], [prompt_tmpl])
-    refine_select.change(change_refine_tmpl, [refine_select], [refine_tmpl])
-    index_type.change(lock_params, [index_type], [num_children, max_keywords_per_chunk])
-    construct_btn.click(construct_index, [upload_file, new_index_name, index_type, max_input_size, num_outputs, max_chunk_overlap, chunk_size_limit, embedding_limit, separator, num_children], [index_select])
-if __name__ == "__main__":
-    demo.title = "WizardLM Doc Chat"
-    demo.queue().launch(server_name="0.0.0.0", server_port=7860, share=False)

index/docstore.json DELETED Viewed

@@ -1 +0,0 @@

- {"docstore/metadata": {"8ced199c-f95b-4e3f-b257-dada8d54a55d": {"doc_hash": "46058eadd904a825aebbe7837bc99d1470311336dff046005edcbb02ad36a2e0"}, "ec3daf8e-bae2-44d6-8c70-97e5e74ebbb7": {"doc_hash": "56ceb6ae86fb3887dc0939a1f5c4dbfd994304186b817ba021de140315d0c52d"}, "9f1a3e4e-6fe6-4580-85ed-a6c15856c7a2": {"doc_hash": "25aa44f21ebc8354f28021c3daefdc80847660c61d488ce0e7e9892e35444685"}, "6691ff87-c5c6-4e59-b9c6-3257f47b77e1": {"doc_hash": "019db476096b4a9fbc014d71c9634f5d01ad3bf6e51d093ba7f5bcb3f1a6d7a1"}, "c4b8f302-807e-4714-81a6-b0b6cc5a5f55": {"doc_hash": "37e82baffd9bcb78e6fda3645adaf5b647a502b3e8c75f4f9d5fad3adc56e24e"}, "0867d7c0-321a-4248-8d1a-e38083fb8533": {"doc_hash": "c01640a9026941025384be8c763709f29955f54deb80b1f319f3673fff646b39"}, "31d64cd1-61ca-4aa3-b592-4dbdaf74ed8d": {"doc_hash": "86b2375c5e598a26712f2a748d483df9f458f192009b37d41b65e3300a156964"}, "b8b3c21d-2a62-49e6-a62f-53b87cb90f0f": {"doc_hash": "08b5ab8c522e5b8adfc2b738a155ca85335d1f2c2ede00a967f69406c54b37b3"}, "cb4b7053-efcb-4b62-bef8-d401726a49a3": {"doc_hash": "a1adc57df1046c4bab52af9f1ee767ec009c3a41b6d8b4d642ee6099d109e957"}, "65050326-fdf0-421d-8135-003d0277153a": {"doc_hash": "e042c399f010602b6ea30ddd6e02a6e2d2221a35c4f3bc67027169349762c36f"}}, "docstore/data": {"ec3daf8e-bae2-44d6-8c70-97e5e74ebbb7": {"__data__": {"text": "Bitcoin: A Peer-to-Peer Electronic Cash System\n\nSatoshi Nakamoto\nsatoshin@gmx.com\nwww.bitcoin.org\n\nAbstract. A purely peer-to-peer version of electronic cash would allow online \npayments to be sent directly from one party to another without going through a \nfinancial institution. Digital signatures provide part of the solution, but the main \nbenefits are lost if a trusted third party is still required to prevent double-spending. \nWe propose a solution to the double-spending problem using a peer-to-peer network. 
\nThe network timestamps transactions by hashing them into an ongoing chain of \nhash-based proof-of-work, forming a record that cannot be changed without redoing \nthe proof-of-work. The longest chain not only serves as proof of the sequence of \nevents witnessed, but proof that it came from the largest pool of CPU power. As \nlong as a majority of CPU power is controlled by nodes that are not cooperating to \nattack the network, they'll generate the longest chain and outpace attackers. The \nnetwork itself requires minimal structure. Messages are broadcast on a best effort \nbasis, and nodes can leave and rejoin the network at will, accepting the longest \nproof-of-work chain as proof of what happened while they were gone.\n\n1.\n\nIntroduction\n\nCommerce on the Internet has come to rely almost exclusively on financial institutions serving as \ntrusted third parties to process electronic payments. While the system works well enough for \nmost transactions, it still suffers from the inherent weaknesses of the trust based model. \nCompletely non-reversible transactions are not really possible, since financial institutions cannot \navoid mediating disputes. The cost of mediation increases transaction costs, limiting the \nminimum practical transaction size and cutting off the possibility for small casual transactions, \nand there is a broader cost in the loss of ability to make non-reversible payments for non-\nreversible services. With the possibility of reversal, the need for trust spreads. Merchants must \nbe wary of their customers, hassling them for more information than they would otherwise need. \nA certain percentage of fraud is accepted as unavoidable. 
These costs and payment uncertainties \ncan be avoided in person by using physical currency, but no mechanism exists to make payments \nover a communications channel without a trusted party.\n\nWhat is needed is an electronic payment system based on cryptographic proof instead of trust, \nallowing any two willing parties to transact directly with each other without the need for a trusted \nthird party. Transactions that are computationally impractical to reverse would protect sellers \nfrom fraud, and routine escrow mechanisms could easily be implemented to protect buyers. In \nthis paper, we propose a solution to the double-spending problem using a peer-to-peer distributed \ntimestamp server to generate computational proof of the chronological order of transactions. The \nsystem is secure as long as honest nodes collectively control more CPU power than any \ncooperating group of attacker nodes.\n\n1\n\n\f\n2. Transactions\n\nWe define an electronic coin as a chain of digital signatures. Each owner transfers the coin to the \nnext by digitally signing a hash of the previous transaction and the public key of the next owner \nand adding these to the end of the coin. A payee can verify the signatures to verify the chain of \nownership.\n\nTransaction\n\nTransaction\n\nTransaction\n\nOwner 1's\nPublic Key\n\nOwner 2's\nPublic Key\n\nOwner", "doc_id": "ec3daf8e-bae2-44d6-8c70-97e5e74ebbb7", "embedding": null, "doc_hash": "56ceb6ae86fb3887dc0939a1f5c4dbfd994304186b817ba021de140315d0c52d", "extra_info": null, "node_info": {"start": 0, "end": 3659}, "relationships": {"1": "8ced199c-f95b-4e3f-b257-dada8d54a55d", "3": "9f1a3e4e-6fe6-4580-85ed-a6c15856c7a2"}}, "__type__": "1"}, "9f1a3e4e-6fe6-4580-85ed-a6c15856c7a2": {"__data__": {"text": "distributed \ntimestamp server to generate computational proof of the chronological order of transactions. 
The \nsystem is secure as long as honest nodes collectively control more CPU power than any \ncooperating group of attacker nodes.\n\n1\n\n\f\n2. Transactions\n\nWe define an electronic coin as a chain of digital signatures. Each owner transfers the coin to the \nnext by digitally signing a hash of the previous transaction and the public key of the next owner \nand adding these to the end of the coin. A payee can verify the signatures to verify the chain of \nownership.\n\nTransaction\n\nTransaction\n\nTransaction\n\nOwner 1's\nPublic Key\n\nOwner 2's\nPublic Key\n\nOwner 3's\nPublic Key\n\nHash\n\nHash\n\nHash\n\nOwner 0's\nSignature\n\n Verify\n\nS ig n \n\nOwner 1's\nSignature\n\n Verify\n\nS ig n \n\nOwner 2's\nSignature\n\nOwner 1's\nPrivate Key\n\nOwner 2's\nPrivate Key\n\nOwner 3's\nPrivate Key\n\nThe problem of course is the payee can't verify that one of the owners did not double-spend \nthe coin. A common solution is to introduce a trusted central authority, or mint, that checks every \ntransaction for double spending. After each transaction, the coin must be returned to the mint to \nissue a new coin, and only coins issued directly from the mint are trusted not to be double-spent. \nThe problem with this solution is that the fate of the entire money system depends on the \ncompany running the mint, with every transaction having to go through them, just like a bank.\n\nWe need a way for the payee to know that the previous owners did not sign any earlier \ntransactions. For our purposes, the earliest transaction is the one that counts, so we don't care \nabout later attempts to double-spend. The only way to confirm the absence of a transaction is to \nbe aware of all transactions. In the mint based model, the mint was aware of all transactions and \ndecided which arrived first. 
To accomplish this without a trusted party, transactions must be \npublicly announced [1], and we need a system for participants to agree on a single history of the \norder in which they were received. The payee needs proof that at the time of each transaction, the \nmajority of nodes agreed it was the first received. \n\n3. Timestamp Server\n\nThe solution we propose begins with a timestamp server. A timestamp server works by taking a \nhash of a block of items to be timestamped and widely publishing the hash, such as in a \nnewspaper or Usenet post [2-5]. The timestamp proves that the data must have existed at the \ntime, obviously, in order to get into the hash. Each timestamp includes the previous timestamp in \nits hash, forming a chain, with each additional timestamp reinforcing the ones before it.\n\nHash\n\nHash\n\nBlock\n\nBlock\n\nItem\n\nItem\n\n...\n\nItem\n\nItem\n\n...\n\n2\n\n\f\n4. Proof-of-Work\n\nTo implement a distributed timestamp server on a peer-to-peer basis, we will need to use a proof-\nof-work system similar to Adam Back's Hashcash [6], rather than newspaper or Usenet posts. \nThe proof-of-work involves scanning for a value that when hashed, such as with SHA-256, the \nhash begins with a number of zero bits. 
The average work required is exponential in the number \nof zero bits required and can be verified by executing a single hash.\n\nFor our timestamp network, we implement the proof-of-work by incrementing a nonce in the \nblock until a value is found that gives the block's hash the required zero bits.", "doc_id": "9f1a3e4e-6fe6-4580-85ed-a6c15856c7a2", "embedding": null, "doc_hash": "25aa44f21ebc8354f28021c3daefdc80847660c61d488ce0e7e9892e35444685", "extra_info": null, "node_info": {"start": 3097, "end": 6575}, "relationships": {"1": "8ced199c-f95b-4e3f-b257-dada8d54a55d", "2": "ec3daf8e-bae2-44d6-8c70-97e5e74ebbb7", "3": "6691ff87-c5c6-4e59-b9c6-3257f47b77e1"}}, "__type__": "1"}, "6691ff87-c5c6-4e59-b9c6-3257f47b77e1": {"__data__": {"text": "Proof-of-Work\n\nTo implement a distributed timestamp server on a peer-to-peer basis, we will need to use a proof-\nof-work system similar to Adam Back's Hashcash [6], rather than newspaper or Usenet posts. \nThe proof-of-work involves scanning for a value that when hashed, such as with SHA-256, the \nhash begins with a number of zero bits. The average work required is exponential in the number \nof zero bits required and can be verified by executing a single hash.\n\nFor our timestamp network, we implement the proof-of-work by incrementing a nonce in the \nblock until a value is found that gives the block's hash the required zero bits. Once the CPU \neffort has been expended to make it satisfy the proof-of-work, the block cannot be changed \nwithout redoing the work. As later blocks are chained after it, the work to change the block \nwould include redoing all the blocks after it.\n\nBlock\n\nBlock\n\nPrev Hash\n\nNonce\n\nPrev Hash\n\nNonce\n\nTx\n\nTx\n\n...\n\nTx\n\nTx\n\n...\n\nThe proof-of-work also solves the problem of determining representation in majority decision \nmaking. If the majority were based on one-IP-address-one-vote, it could be subverted by anyone \nable to allocate many IPs. 
Proof-of-work is essentially one-CPU-one-vote. The majority \ndecision is represented by the longest chain, which has the greatest proof-of-work effort invested \nin it. If a majority of CPU power is controlled by honest nodes, the honest chain will grow the \nfastest and outpace any competing chains. To modify a past block, an attacker would have to \nredo the proof-of-work of the block and all blocks after it and then catch up with and surpass the \nwork of the honest nodes. We will show later that the probability of a slower attacker catching up \ndiminishes exponentially as subsequent blocks are added.\n\nTo compensate for increasing hardware speed and varying interest in running nodes over time, \nthe proof-of-work difficulty is determined by a moving average targeting an average number of \nblocks per hour. If they're generated too fast, the difficulty increases.\n\n5. Network\n\nThe steps to run the network are as follows:\n\n1) New transactions are broadcast to all nodes.\n2) Each node collects new transactions into a block. \n3) Each node works on finding a difficult proof-of-work for its block.\n4) When a node finds a proof-of-work, it broadcasts the block to all nodes.\n5) Nodes accept the block only if all transactions in it are valid and not already spent.\n6) Nodes express their acceptance of the block by working on creating the next block in the \n\nchain, using the hash of the accepted block as the previous hash.\n\nNodes always consider the longest chain to be the correct one and will keep working on \nextending it. If two nodes broadcast different versions of the next block simultaneously, some \nnodes may receive one or the other first. In that case, they work on the first one they received, \nbut save the other branch in case it becomes longer. 
The tie will be broken when the next proof-\nof-work is found and one branch becomes longer; the nodes that were working on the other \nbranch will then switch to the longer one.\n\n3\n\n\f\nNew transaction broadcasts do not necessarily need to reach all nodes. As long as they reach \nmany nodes, they will get into a block before long. Block broadcasts are also tolerant of dropped \nmessages. If a node does not receive a block, it will request it when it receives the next block and \nrealizes it missed one.\n\n6.\n\nIncentive\n\nBy convention, the first transaction in a block is a special transaction that starts a new coin owned \nby the creator of the block. This adds an incentive for", "doc_id": "6691ff87-c5c6-4e59-b9c6-3257f47b77e1", "embedding": null, "doc_hash": "019db476096b4a9fbc014d71c9634f5d01ad3bf6e51d093ba7f5bcb3f1a6d7a1", "extra_info": null, "node_info": {"start": 6606, "end": 10280}, "relationships": {"1": "8ced199c-f95b-4e3f-b257-dada8d54a55d", "2": "9f1a3e4e-6fe6-4580-85ed-a6c15856c7a2", "3": "c4b8f302-807e-4714-81a6-b0b6cc5a5f55"}}, "__type__": "1"}, "c4b8f302-807e-4714-81a6-b0b6cc5a5f55": {"__data__": {"text": "save the other branch in case it becomes longer. The tie will be broken when the next proof-\nof-work is found and one branch becomes longer; the nodes that were working on the other \nbranch will then switch to the longer one.\n\n3\n\n\f\nNew transaction broadcasts do not necessarily need to reach all nodes. As long as they reach \nmany nodes, they will get into a block before long. Block broadcasts are also tolerant of dropped \nmessages. If a node does not receive a block, it will request it when it receives the next block and \nrealizes it missed one.\n\n6.\n\nIncentive\n\nBy convention, the first transaction in a block is a special transaction that starts a new coin owned \nby the creator of the block. 
This adds an incentive for nodes to support the network, and provides \na way to initially distribute coins into circulation, since there is no central authority to issue them. \nThe steady addition of a constant of amount of new coins is analogous to gold miners expending \nresources to add gold to circulation. In our case, it is CPU time and electricity that is expended.\n\nThe incentive can also be funded with transaction fees. If the output value of a transaction is \nless than its input value, the difference is a transaction fee that is added to the incentive value of \nthe block containing the transaction. Once a predetermined number of coins have entered \ncirculation, the incentive can transition entirely to transaction fees and be completely inflation \nfree.\n\nThe incentive may help encourage nodes to stay honest. If a greedy attacker is able to \nassemble more CPU power than all the honest nodes, he would have to choose between using it \nto defraud people by stealing back his payments, or using it to generate new coins. He ought to \nfind it more profitable to play by the rules, such rules that favour him with more new coins than \neveryone else combined, than to undermine the system and the validity of his own wealth.\n\n7. Reclaiming Disk Space\n\nOnce the latest transaction in a coin is buried under enough blocks, the spent transactions before \nit can be discarded to save disk space. To facilitate this without breaking the block's hash, \ntransactions are hashed in a Merkle Tree [7][2][5], with only the root included in the block's hash. \nOld blocks can then be compacted by stubbing off branches of the tree. 
The interior hashes do \nnot need to be stored.\n\nBlock\n\nBlock Header (Block Hash)\n\nBlock\n\nBlock Header (Block Hash)\n\nPrev Hash\n\nNonce\n\nPrev Hash\n\nNonce\n\nRoot Hash\n\nRoot Hash\n\nHash01\n\nHash23\n\nHash01\n\nHash23\n\nHash0\n\nHash1\n\nHash2\n\nHash3\n\nHash2\n\nHash3\n\nTx0\n\nTx1\n\nTx2\n\nTx3\n\nTx3\n\nTransactions Hashed in a Merkle Tree\n\nAfter Pruning Tx0-2 from the Block\n\nA block header with no transactions would be about 80 bytes. If we suppose blocks are \ngenerated every 10 minutes, 80 bytes * 6 * 24 * 365 = 4.2MB per year. With computer systems \ntypically selling with 2GB of RAM as of 2008, and Moore's Law predicting current growth of \n1.2GB per year, storage should not be a problem even if the block headers must be kept in \nmemory.\n\n4\n\n\f\n8.\n\nSimplified Payment Verification\n\nIt is possible to verify payments without running a full network node. A user only needs to keep \na copy of the block headers of the longest proof-of-work chain, which he can get by querying \nnetwork nodes until he's convinced he has the longest chain, and obtain", "doc_id": "c4b8f302-807e-4714-81a6-b0b6cc5a5f55", "embedding": null, "doc_hash": "37e82baffd9bcb78e6fda3645adaf5b647a502b3e8c75f4f9d5fad3adc56e24e", "extra_info": null, "node_info": {"start": 10213, "end": 13672}, "relationships": {"1": "8ced199c-f95b-4e3f-b257-dada8d54a55d", "2": "6691ff87-c5c6-4e59-b9c6-3257f47b77e1", "3": "0867d7c0-321a-4248-8d1a-e38083fb8533"}}, "__type__": "1"}, "0867d7c0-321a-4248-8d1a-e38083fb8533": {"__data__": {"text": "would be about 80 bytes. If we suppose blocks are \ngenerated every 10 minutes, 80 bytes * 6 * 24 * 365 = 4.2MB per year. 
With computer systems \ntypically selling with 2GB of RAM as of 2008, and Moore's Law predicting current growth of \n1.2GB per year, storage should not be a problem even if the block headers must be kept in \nmemory.\n\n4\n\n\f\n8.\n\nSimplified Payment Verification\n\nIt is possible to verify payments without running a full network node. A user only needs to keep \na copy of the block headers of the longest proof-of-work chain, which he can get by querying \nnetwork nodes until he's convinced he has the longest chain, and obtain the Merkle branch \nlinking the transaction to the block it's timestamped in. He can't check the transaction for \nhimself, but by linking it to a place in the chain, he can see that a network node has accepted it, \nand blocks added after it further confirm the network has accepted it.\n\nLongest Proof-of-Work Chain\n\nBlock Header\n\nBlock Header\n\nBlock Header\n\nPrev Hash\n\nNonce\n\nPrev Hash\n\nNonce\n\nPrev Hash\n\nNonce\n\nMerkle Root\n\nMerkle Root\n\nMerkle Root\n\nHash01\n\nHash23\n\nMerkle Branch for Tx3\n\nHash2\n\nHash3\n\nTx3\n\nAs such, the verification is reliable as long as honest nodes control the network, but is more \nvulnerable if the network is overpowered by an attacker. While network nodes can verify \ntransactions for themselves, the simplified method can be fooled by an attacker's fabricated \ntransactions for as long as the attacker can continue to overpower the network. One strategy to \nprotect against this would be to accept alerts from network nodes when they detect an invalid \nblock, prompting the user's software to download the full block and alerted transactions to \nconfirm the inconsistency. Businesses that receive frequent payments will probably still want to \nrun their own nodes for more independent security and quicker verification.\n\n9. 
Combining and Splitting Value\n\nAlthough it would be possible to handle coins individually, it would be unwieldy to make a \nseparate transaction for every cent in a transfer. To allow value to be split and combined, \ntransactions contain multiple inputs and outputs. Normally there will be either a single input \nfrom a larger previous transaction or multiple inputs combining smaller amounts, and at most two \noutputs: one for the payment, and one returning the change, if any, back to the sender. \n\nTransaction\n\nOut\n\n...\n\nIn\n\nIn\n\n...\n\nIt should be noted that fan-out, where a transaction depends on several transactions, and those \ntransactions depend on many more, is not a problem here. There is never the need to extract a \ncomplete standalone copy of a transaction's history.\n\n5\n\n\f\n10. Privacy\n\nThe traditional banking model achieves a level of privacy by limiting access to information to the \nparties involved and the trusted third party. The necessity to announce all transactions publicly \nprecludes this method, but privacy can still be maintained by breaking the flow of information in \nanother place: by keeping public keys anonymous. The public can see that someone is sending \nan amount to someone else, but without information linking the transaction to anyone. This is \nsimilar to the", "doc_id": "0867d7c0-321a-4248-8d1a-e38083fb8533", "embedding": null, "doc_hash": "c01640a9026941025384be8c763709f29955f54deb80b1f319f3673fff646b39", "extra_info": null, "node_info": {"start": 13744, "end": 17120}, "relationships": {"1": "8ced199c-f95b-4e3f-b257-dada8d54a55d", "2": "c4b8f302-807e-4714-81a6-b0b6cc5a5f55", "3": "31d64cd1-61ca-4aa3-b592-4dbdaf74ed8d"}}, "__type__": "1"}, "31d64cd1-61ca-4aa3-b592-4dbdaf74ed8d": {"__data__": {"text": "should be noted that fan-out, where a transaction depends on several transactions, and those \ntransactions depend on many more, is not a problem here. 
There is never the need to extract a \ncomplete standalone copy of a transaction's history.\n\n5\n\n\f\n10. Privacy\n\nThe traditional banking model achieves a level of privacy by limiting access to information to the \nparties involved and the trusted third party. The necessity to announce all transactions publicly \nprecludes this method, but privacy can still be maintained by breaking the flow of information in \nanother place: by keeping public keys anonymous. The public can see that someone is sending \nan amount to someone else, but without information linking the transaction to anyone. This is \nsimilar to the level of information released by stock exchanges, where the time and size of \nindividual trades, the \"tape\", is made public, but without telling who the parties were.\n\nTraditional Privacy Model\n\nIdentities\n\nTransactions\n\nTrusted\nThird Party\n\nCounterparty\n\nPublic\n\nNew Privacy Model\n\nIdentities\n\nTransactions\n\nPublic\n\nAs an additional firewall, a new key pair should be used for each transaction to keep them \nfrom being linked to a common owner. Some linking is still unavoidable with multi-input \ntransactions, which necessarily reveal that their inputs were owned by the same owner. The risk \nis that if the owner of a key is revealed, linking could reveal other transactions that belonged to \nthe same owner.\n\n11. Calculations\n\nWe consider the scenario of an attacker trying to generate an alternate chain faster than the honest \nchain. Even if this is accomplished, it does not throw the system open to arbitrary changes, such \nas creating value out of thin air or taking money that never belonged to the attacker. Nodes are \nnot going to accept an invalid transaction as payment, and honest nodes will never accept a block \ncontaining them. 
An attacker can only try to change one of his own transactions to take back \nmoney he recently spent.\n\nThe race between the honest chain and an attacker chain can be characterized as a Binomial \nRandom Walk. The success event is the honest chain being extended by one block, increasing its \nlead by +1, and the failure event is the attacker's chain being extended by one block, reducing the \ngap by -1.\n\nThe probability of an attacker catching up from a given deficit is analogous to a Gambler's \nRuin problem. Suppose a gambler with unlimited credit starts at a deficit and plays potentially an \ninfinite number of trials to try to reach breakeven. We can calculate the probability he ever \nreaches breakeven, or that an attacker ever catches up with the honest chain, as follows [8]:\n\np = probability an honest node finds the next block\nq = probability the attacker finds the next block\nqz = probability the attacker will ever catch up from z blocks behind\n\nq z={ 1\n\n\ue09eq / p\ue09fz\n\nif p\u2264q\n\nif p\ue085q}\n\n6\n\n\f\nGiven our assumption that p > q, the probability drops exponentially as the number of blocks the \nattacker has to catch up with increases. With the odds against him, if he doesn't make a lucky \nlunge forward early on, his chances become vanishingly small as he falls further behind.\n\nWe now consider how long the recipient of a new transaction needs to wait before being \nsufficiently certain the sender can't change the transaction. We assume the sender is an attacker \nwho wants to make the recipient believe he paid him for a while, then switch it to pay back to \nhimself after some time has passed. 
The receiver will be alerted when that happens, but the \nsender hopes it will be too late.\n\nThe receiver generates a new key pair and gives the", "doc_id": "31d64cd1-61ca-4aa3-b592-4dbdaf74ed8d", "embedding": null, "doc_hash": "86b2375c5e598a26712f2a748d483df9f458f192009b37d41b65e3300a156964", "extra_info": null, "node_info": {"start": 17007, "end": 20730}, "relationships": {"1": "8ced199c-f95b-4e3f-b257-dada8d54a55d", "2": "0867d7c0-321a-4248-8d1a-e38083fb8533", "3": "b8b3c21d-2a62-49e6-a62f-53b87cb90f0f"}}, "__type__": "1"}, "b8b3c21d-2a62-49e6-a62f-53b87cb90f0f": {"__data__": {"text": "our assumption that p > q, the probability drops exponentially as the number of blocks the \nattacker has to catch up with increases. With the odds against him, if he doesn't make a lucky \nlunge forward early on, his chances become vanishingly small as he falls further behind.\n\nWe now consider how long the recipient of a new transaction needs to wait before being \nsufficiently certain the sender can't change the transaction. We assume the sender is an attacker \nwho wants to make the recipient believe he paid him for a while, then switch it to pay back to \nhimself after some time has passed. The receiver will be alerted when that happens, but the \nsender hopes it will be too late.\n\nThe receiver generates a new key pair and gives the public key to the sender shortly before \nsigning. This prevents the sender from preparing a chain of blocks ahead of time by working on \nit continuously until he is lucky enough to get far enough ahead, then executing the transaction at \nthat moment. Once the transaction is sent, the dishonest sender starts working in secret on a \nparallel chain containing an alternate version of his transaction.\n\nThe recipient waits until the transaction has been added to a block and z blocks have been \nlinked after it. 
He doesn't know the exact amount of progress the attacker has made, but \nassuming the honest blocks took the average expected time per block, the attacker's potential \nprogress will be a Poisson distribution with expected value:\n\n\ue0c1=z\n\nq\np\n\nTo get the probability the attacker could still catch up now, we multiply the Poisson density for \neach amount of progress he could have made by the probability he could catch up from that point:\n\n\u221e \ue0c1k e\u2212\ue0c1\n\u2211\nk !\n\nk =0\n\n\u22c5{\ue09eq / p\ue09f\ue09e z\u2212k \ue09f\n\n1\n\nif k \u2264 z\n\nif k \ue085 z}\n\nRearranging to avoid summing the infinite tail of the distribution...\n\n1\u2212\u2211\n\nz \ue0c1k e\u2212\ue0c1\nk!\n\nk =0\n\n\ue09e1\u2212\ue09eq / p\ue09f\ue09e z\u2212 k \ue09f\ue09f\n\nConverting to C code...\n\n#include <math.h>\ndouble AttackerSuccessProbability(double q, int z)\n{\n double p = 1.0 - q;\n double lambda = z * (q / p);\n double sum = 1.0;\n int i, k;\n for (k = 0; k <= z; k++)\n {\n double poisson = exp(-lambda);\n for (i = 1; i <= k; i++)\n poisson *= lambda / i;\n sum -= poisson * (1 - pow(q / p, z - k));\n }\n return sum;\n}\n\n7\n\n\f\nRunning some results, we can see the probability drop off exponentially with z.\n\nq=0.1\nz=0 P=1.0000000\nz=1 P=0.2045873\nz=2 P=0.0509779\nz=3 P=0.0131722\nz=4 P=0.0034552\nz=5 P=0.0009137\nz=6 P=0.0002428\nz=7 P=0.0000647\nz=8 P=0.0000173\nz=9 P=0.0000046\nz=10 P=0.0000012\n\nq=0.3\nz=0 P=1.0000000\nz=5 P=0.1773523\nz=10 ", "doc_id": "b8b3c21d-2a62-49e6-a62f-53b87cb90f0f", "embedding": null, "doc_hash": "08b5ab8c522e5b8adfc2b738a155ca85335d1f2c2ede00a967f69406c54b37b3", "extra_info": null, "node_info": {"start": 20764, "end": 23431}, "relationships": {"1": "8ced199c-f95b-4e3f-b257-dada8d54a55d", "2": "31d64cd1-61ca-4aa3-b592-4dbdaf74ed8d", "3": "cb4b7053-efcb-4b62-bef8-d401726a49a3"}}, "__type__": "1"}, "cb4b7053-efcb-4b62-bef8-d401726a49a3": {"__data__": {"text": "off exponentially with z.\n\nq=0.1\nz=0 
P=1.0000000\nz=1 P=0.2045873\nz=2 P=0.0509779\nz=3 P=0.0131722\nz=4 P=0.0034552\nz=5 P=0.0009137\nz=6 P=0.0002428\nz=7 P=0.0000647\nz=8 P=0.0000173\nz=9 P=0.0000046\nz=10 P=0.0000012\n\nq=0.3\nz=0 P=1.0000000\nz=5 P=0.1773523\nz=10 P=0.0416605\nz=15 P=0.0101008\nz=20 P=0.0024804\nz=25 P=0.0006132\nz=30 P=0.0001522\nz=35 P=0.0000379\nz=40 P=0.0000095\nz=45 P=0.0000024\nz=50 P=0.0000006\n\nSolving for P less than 0.1%...\n\nP < 0.001\nq=0.10 z=5\nq=0.15 z=8\nq=0.20 z=11\nq=0.25 z=15\nq=0.30 z=24\nq=0.35 z=41\nq=0.40 z=89\nq=0.45 z=340\n\n12. Conclusion\n\nWe have proposed a system for electronic transactions without relying on trust. We started with \nthe usual framework of coins made from digital signatures, which provides strong control of \nownership, but is incomplete without a way to prevent double-spending. To solve this, we \nproposed a peer-to-peer network using proof-of-work to record a public history of transactions \nthat quickly becomes computationally impractical for an attacker to change if honest nodes \ncontrol a majority of CPU power. The network is robust in its unstructured simplicity. Nodes \nwork all at once with little coordination. They do not need to be identified, since messages are \nnot routed to any particular place and only need to be delivered on a best effort basis. Nodes can \nleave and rejoin the network at will, accepting the proof-of-work chain as proof of what \nhappened while they were gone. They vote with their CPU power, expressing their acceptance of \nvalid blocks by working on extending them and rejecting invalid blocks by refusing to work on \nthem. Any needed rules and incentives can be enforced with this consensus mechanism.\n\n8\n\n\f\nReferences\n\n[1] W. Dai, \"b-money,\" http://www.weidai.com/bmoney.txt, 1998.\n\n[2] H. Massias, X.S. Avila, and J.-J. Quisquater, \"Design of a secure timestamping service with minimal \n\ntrust requirements,\" In 20th Symposium on Information Theory in the Benelux, May 1999.\n\n[3] S. 
Haber, W.S. Stornetta, \"How to time-stamp a digital document,\" In Journal of Cryptology, vol 3, no \n\n2, pages 99-111, 1991.\n\n[4] D. Bayer, S. Haber, W.S. Stornetta, \"Improving the efficiency and reliability of digital time-stamping,\" \nIn Sequences II: Methods in Communication, Security and Computer Science, pages 329-334, 1993.\n\n[5] S. Haber, W.S. Stornetta, \"Secure names for bit-strings,\" In Proceedings of the", "doc_id": "cb4b7053-efcb-4b62-bef8-d401726a49a3", "embedding": null, "doc_hash": "a1adc57df1046c4bab52af9f1ee767ec009c3a41b6d8b4d642ee6099d109e957", "extra_info": null, "node_info": {"start": 23806, "end": 26344}, "relationships": {"1": "8ced199c-f95b-4e3f-b257-dada8d54a55d", "2": "b8b3c21d-2a62-49e6-a62f-53b87cb90f0f", "3": "65050326-fdf0-421d-8135-003d0277153a"}}, "__type__": "1"}, "65050326-fdf0-421d-8135-003d0277153a": {"__data__": {"text": "Massias, X.S. Avila, and J.-J. Quisquater, \"Design of a secure timestamping service with minimal \n\ntrust requirements,\" In 20th Symposium on Information Theory in the Benelux, May 1999.\n\n[3] S. Haber, W.S. Stornetta, \"How to time-stamp a digital document,\" In Journal of Cryptology, vol 3, no \n\n2, pages 99-111, 1991.\n\n[4] D. Bayer, S. Haber, W.S. Stornetta, \"Improving the efficiency and reliability of digital time-stamping,\" \nIn Sequences II: Methods in Communication, Security and Computer Science, pages 329-334, 1993.\n\n[5] S. Haber, W.S. Stornetta, \"Secure names for bit-strings,\" In Proceedings of the 4th ACM Conference \n\non Computer and Communications Security, pages 28-35, April 1997.\n\n[6] A. Back, \"Hashcash - a denial of service counter-measure,\" \nhttp://www.hashcash.org/papers/hashcash.pdf, 2002.\n\n[7] R.C. Merkle, \"Protocols for public key cryptosystems,\" In Proc. 1980 Symposium on Security and \n\nPrivacy, IEEE Computer Society, pages 122-133, April 1980.\n\n[8] W. 
Feller, \"An introduction to probability theory and its applications,\" 1957.\n\n9\n\n\f", "doc_id": "65050326-fdf0-421d-8135-003d0277153a", "embedding": null, "doc_hash": "e042c399f010602b6ea30ddd6e02a6e2d2221a35c4f3bc67027169349762c36f", "extra_info": null, "node_info": {"start": 25973, "end": 27035}, "relationships": {"1": "8ced199c-f95b-4e3f-b257-dada8d54a55d", "2": "cb4b7053-efcb-4b62-bef8-d401726a49a3"}}, "__type__": "1"}}}

index/index_store.json DELETED Viewed

@@ -1 +0,0 @@

- {"index_store/data": {"7f82bee6-1192-4ff9-9732-1eaadb062490": {"__type__": "list", "__data__": {"index_id": "7f82bee6-1192-4ff9-9732-1eaadb062490", "summary": null, "nodes": ["ec3daf8e-bae2-44d6-8c70-97e5e74ebbb7", "9f1a3e4e-6fe6-4580-85ed-a6c15856c7a2", "6691ff87-c5c6-4e59-b9c6-3257f47b77e1", "c4b8f302-807e-4714-81a6-b0b6cc5a5f55", "0867d7c0-321a-4248-8d1a-e38083fb8533", "31d64cd1-61ca-4aa3-b592-4dbdaf74ed8d", "b8b3c21d-2a62-49e6-a62f-53b87cb90f0f", "cb4b7053-efcb-4b62-bef8-d401726a49a3", "65050326-fdf0-421d-8135-003d0277153a"]}}}}

index/vector_store.json DELETED Viewed

	@@ -1 +0,0 @@
1	- {"embedding_dict": {}, "text_id_to_doc_id": {}}

jsconfig.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+  "compilerOptions": {
+    "baseUrl": ".",
+    "paths": {
+      "@/*": ["./src/*"]
+    }
+  }
+}

llm.py DELETED Viewed

@@ -1,276 +0,0 @@
-import os
-from langchain.llms import LlamaCpp
-from llama_index import (
-    GPTVectorStoreIndex,
-    GPTListIndex,
-    ServiceContext,
-    ResponseSynthesizer,
-    LangchainEmbedding
-)
-from langchain.embeddings import HuggingFaceEmbeddings
-from llama_index import download_loader, StorageContext, load_index_from_storage
-from llama_index import (
-    Document,
-    LLMPredictor,
-    PromptHelper
-)
-from llama_index.indices.postprocessor import SimilarityPostprocessor
-from llama_index.query_engine import RetrieverQueryEngine
-from llama_index.storage.index_store import SimpleIndexStore
-from llama_index.storage.docstore import SimpleDocumentStore
-from llama_index.storage.storage_context import SimpleVectorStore
-from googlesearch import search as google_search
-from utils import *
-import logging
-import argparse
-model_path = "wizardLM-7B.ggmlv3.q4_0.bin"
-def query_llm(index, prompt, service_context, retriever_mode='embedding', response_mode='compact'):
-    """Run ``prompt`` against ``index`` and return the query engine's response.
-
-    Retrieved nodes are filtered by a ``SimilarityPostprocessor`` with a
-    cutoff of 0.7 before the response is synthesized.
-    """
-    postprocessors = [SimilarityPostprocessor(similarity_cutoff=0.7)]
-    synthesizer = ResponseSynthesizer.from_args(
-        service_context=service_context,
-        node_postprocessors=postprocessors,
-    )
-    node_retriever = index.as_retriever(
-        retriever_mode=retriever_mode,
-        service_context=service_context,
-    )
-    engine = RetrieverQueryEngine.from_args(
-        node_retriever,
-        response_synthesizer=synthesizer,
-        response_mode=response_mode,
-        service_context=service_context,
-    )
-    return engine.query(prompt)
-def get_documents(file_src):
-    """Load every entry of ``file_src`` into a flat list of documents.
-
-    Each entry is either a string or an object exposing a ``.name`` path:
-
-    * strings containing ``"http"`` are fetched with ``BeautifulSoupWebReader``;
-    * other strings are skipped (now with a warning instead of silently);
-    * ``.pdf`` paths are read with ``CJKPDFReader``;
-    * anything else is read as UTF-8 text and wrapped in a ``Document``.
-
-    Returns the list of loaded documents (empty if nothing could be loaded).
-    """
-    documents = []
-    logging.debug("Loading documents...")
-    print(f"file_src: {file_src}")
-    for file in file_src:
-        # isinstance also accepts str subclasses, unlike ``type(file) == str``.
-        if isinstance(file, str):
-            print(f"file: {file}")
-            if "http" not in file:
-                # Such entries used to vanish without any trace.
-                logging.warning(f"Skipping unsupported source: {file}")
-                continue
-            logging.debug("Loading web page...")
-            BeautifulSoupWebReader = download_loader("BeautifulSoupWebReader")
-            documents += BeautifulSoupWebReader().load_data([file])
-            continue
-        logging.debug(f"file: {file.name}")
-        if os.path.splitext(file.name)[1] == ".pdf":
-            logging.debug("Loading PDF...")
-            CJKPDFReader = download_loader("CJKPDFReader")
-            documents += CJKPDFReader().load_data(file=file.name)
-        else:
-            logging.debug("Loading text file...")
-            with open(file.name, "r", encoding="utf-8") as f:
-                # add_space is not defined in this file (presumably from utils).
-                text = add_space(f.read())
-            documents.append(Document(text))
-    return documents
-def construct_index(
-    file_src,
-    index_name,
-    index_type,
-    max_input_size=2048,
-    num_outputs=2048,
-    max_chunk_overlap=20,
-    chunk_size_limit=None,
-    embedding_limit=None,
-    separator=" ",
-    num_children=10,
-    max_keywords_per_chunk=10
-):
-    """Build an index from ``file_src`` and persist it under ``./index``.
-
-    A ``GPTVectorStoreIndex`` is built only when ``index_type`` is exactly
-    ``"_GPTVectorStoreIndex"``; every other value yields a ``GPTListIndex``.
-    ``num_children`` and ``max_keywords_per_chunk`` are accepted but unused.
-
-    Returns a ``gr.Dropdown.update`` selecting ``index_name`` among the
-    refreshed choices, or ``None`` when building or persisting raised.
-    """
-    # NOTE(review): search_construct passes "GPTVectorStoreIndex" (no leading
-    # underscore), which therefore takes the GPTListIndex path - confirm intent.
-    # A value of 0 / "" is treated as "not set".
-    if chunk_size_limit == 0:
-        chunk_size_limit = None
-    if embedding_limit == 0:
-        embedding_limit = None
-    if separator == "":
-        separator = " "
-    llama_options = dict(
-        model_path=model_path,
-        n_ctx=2048,
-        use_mlock=True,
-        n_parts=-1,
-        temperature=0.7,
-        top_p=0.40,
-        last_n_tokens_size=100,
-        n_threads=8,
-        f16_kv=True,
-        max_tokens=150,
-    )
-    predictor = LLMPredictor(llm=LlamaCpp(**llama_options))
-    helper = PromptHelper(
-        max_input_size,
-        num_outputs,
-        max_chunk_overlap,
-        embedding_limit,
-        chunk_size_limit,
-        separator=separator,
-    )
-    service_context = ServiceContext.from_defaults(
-        llm_predictor=predictor,
-        prompt_helper=helper,
-    )
-    documents = get_documents(file_src)
-    try:
-        index_cls = GPTVectorStoreIndex if index_type == "_GPTVectorStoreIndex" else GPTListIndex
-        built_index = index_cls.from_documents(documents, service_context=service_context)
-        built_index.storage_context.persist(persist_dir="./index")
-    except Exception as e:
-        # Best-effort: report the failure and signal it with None.
-        print(e)
-        return None
-    choices = refresh_json_list(plain=True)
-    return gr.Dropdown.update(choices=choices, value=index_name)
-def chat_ai(
-    index_select,
-    question,
-    prompt_tmpl,
-    refine_tmpl,
-    sim_k,
-    chat_tone,
-    context,
-    chatbot,
-    search_mode=None,
-):
-    """Answer ``question`` and record the exchange in ``context`` and ``chatbot``.
-
-    When ``index_select`` is ``"search"`` but no search mode is given, a
-    ``"❗search"`` marker is appended to ``chatbot`` and nothing is queried.
-    Otherwise, if ``search_mode`` is non-empty, an index is first built from
-    search results via ``search_construct``; the question is then passed to
-    ``ask_ai``.
-
-    ``chat_tone`` selects the temperature: 0 -> 2, 1 -> 1, anything else -> 0.5.
-
-    Both ``context`` and ``chatbot`` are mutated in place and returned as a
-    ``(context, chatbot)`` tuple.
-    """
-    # ``search_mode`` defaults to None rather than a shared mutable list.
-    if index_select == "search" and not search_mode:
-        chatbot.append((question, "❗search"))
-        return context, chatbot
-    logging.info(f"Question: {question}")
-    if chat_tone == 0:
-        temperature = 2
-    elif chat_tone == 1:
-        temperature = 1
-    else:
-        temperature = 0.5
-    if search_mode:
-        index_select = search_construct(question, search_mode, index_select)
-    logging.debug(f"Index: {index_select}")
-    response = ask_ai(
-        index_select,
-        question,
-        prompt_tmpl,
-        refine_tmpl,
-        sim_k,
-        temperature,
-        context
-    )
-    print(response)
-    if response is None:
-        response = "Please upload a document first"
-    # parse_text is not defined in this file (presumably from utils).
-    response = parse_text(response)
-    context.append({"role": "user", "content": question})
-    context.append({"role": "assistant", "content": response})
-    chatbot.append((question, response))
-    return context, chatbot
-def ask_ai(
-    index_select,
-    question,
-    prompt_tmpl,
-    refine_tmpl,
-    sim_k=1,
-    temprature=0,
-    prefix_messages=None
-):
-    """Query the index persisted under ``./index`` and return the answer text.
-
-    Only ``question`` and ``temprature`` influence the result here;
-    ``index_select``, ``prompt_tmpl``, ``refine_tmpl``, ``sim_k`` and
-    ``prefix_messages`` are accepted for interface compatibility but are not
-    read by this function.
-
-    Returns the response text, or ``None`` when no response was produced.
-    """
-    # ``prefix_messages`` defaults to None rather than a shared mutable list.
-    logging.debug("Querying index...")
-    prompt_helper = PromptHelper(
-        4096,
-        150,
-        -20000
-    )
-    llm = LlamaCpp(model_path=model_path,
-        n_ctx=2048,
-        use_mlock=True,
-        n_parts=-1,
-        temperature=temprature,
-        top_p=0.40,
-        last_n_tokens_size=100,
-        n_threads=4,
-        f16_kv=True,
-        max_tokens=200,
-        n_gpu_layers=40
-    )
-    embeddings = HuggingFaceEmbeddings(model_kwargs={"device": "cuda"})
-    embed_model = LangchainEmbedding(embeddings)
-    llm_predictor = LLMPredictor(
-        llm=llm
-    )
-    service_context = ServiceContext.from_defaults(llm_predictor=llm_predictor, embed_model=embed_model, prompt_helper=prompt_helper)
-    response = None
-    logging.debug("Using GPTVectorStoreIndex")
-    # All three stores are read back from the same persist directory.
-    storage_context = StorageContext.from_defaults(
-        docstore=SimpleDocumentStore.from_persist_dir(persist_dir="./index"),
-        vector_store=SimpleVectorStore.from_persist_dir(persist_dir="./index"),
-        index_store=SimpleIndexStore.from_persist_dir(persist_dir="./index"),
-    )
-    if storage_context is not None:
-        index = load_index_from_storage(service_context=service_context, storage_context=storage_context)
-        response = query_llm(index, question, service_context)
-    if response is None:
-        logging.debug("No response found, returning None")
-        return None
-    logging.info(f"Response: {response}")
-    return response.response
-def search_construct(question, search_mode, index_select):
-    """Build an index from web pages found for ``question``.
-
-    The local LLM is asked to turn ``question`` into comma-separated search
-    terms. For every term and every entry of ``search_mode``:
-
-    * entries containing ``"Google"`` collect links from ``google_search``;
-    * entries containing ``"Manual"`` read links from stdin until ``q``.
-
-    Returns ``index_select`` unchanged when no link was collected; otherwise
-    builds the index through ``construct_index`` and returns the new index
-    name suffixed with ``"_GPTVectorStoreIndex"``.
-    """
-    print(f"You asked: {question}")
-    llm = LlamaCpp(model_path=model_path,
-        n_ctx=400,
-        use_mlock=True,
-        n_parts=-1,
-        temperature=1,
-        top_p=0.40,
-        last_n_tokens_size=100,
-        n_threads=6,
-        f16_kv=True,
-        max_tokens=100
-    )
-    search_terms = (
-        llm.generate(
-            [
-                f"Please extract search terms from the user’s question. The search terms is a concise sentence, which will be searched on Google to obtain relevant information to answer the user’s question, too generalized search terms doesn’t help. Please provide no more than two search terms. Please provide the most relevant search terms only, the search terms should directly correspond to the user’s question. Please separate different search items with commas, with no quote marks. The user’s question is: {question}"
-            ]
-        )
-        .generations[0][0]
-        .text.strip()
-    )
-    search_terms = search_terms.replace('"', "")
-    search_terms = search_terms.replace(".", "")
-    links = []
-    for keywords in search_terms.split(","):
-        keywords = keywords.strip()
-        for search_engine in search_mode:
-            if "Google" in search_engine:
-                print(f"Googling: {keywords}")
-                search_iter = google_search(keywords, num_results=5)
-                # Take at most 10 links but stop when the iterator runs dry;
-                # calling next() ten times raised StopIteration whenever fewer
-                # results came back.
-                links.extend(link for _, link in zip(range(10), search_iter))
-            if "Manual" in search_engine:
-                print(f"Searching manually: {keywords}")
-                print("Please input links manually. (Enter 'q' to quit.)")
-                while True:
-                    link = input("Enter link：\n")
-                    if link == "q":
-                        break
-                    links.append(link)
-    # De-duplicate while keeping first-seen order so the index input is stable.
-    links = list(dict.fromkeys(links))
-    if not links:
-        return index_select
-    print("Extracting data from links...")
-    print("\n".join(links))
-    search_index_name = " ".join(search_terms.split(","))
-    construct_index(links, search_index_name, "GPTVectorStoreIndex")
-    print(f"Index {search_index_name} constructed.")
-    return search_index_name + "_GPTVectorStoreIndex"

next.config.js ADDED Viewed

	@@ -0,0 +1,11 @@

+/**
+ * Next.js build/runtime configuration.
+ * @type {import('next').NextConfig}
+ */
+module.exports = {
+  // Opt in to the experimental `app/` directory.
+  experimental: { appDir: true },
+  // Remote hosts that images may be loaded from.
+  images: { domains: ["upload.wikimedia.org"] },
+};

overwrites.py DELETED Viewed

@@ -1,12 +0,0 @@
-from llama_index import Prompt
-from typing import List
-import logging
-def compact_text_chunks(self, prompt: Prompt, text_chunks: List[str]) -> List[str]:
-    """Merge ``text_chunks`` into one numbered text and re-split it for ``prompt``.
-
-    Blank chunks are dropped, the rest are stripped and prefixed with
-    ``[1]``, ``[2]``, ... and joined with blank lines. The combined text is
-    then split again with the splitter that ``self`` derives from ``prompt``.
-    """
-    logging.debug("Compacting text chunks...🚀🚀🚀")
-    stripped = (chunk.strip() for chunk in text_chunks)
-    numbered = [
-        f"[{position}] {chunk}"
-        for position, chunk in enumerate((s for s in stripped if s), start=1)
-    ]
-    merged = "\n\n".join(numbered)
-    # Re-split so the merged text fits the prompt again.
-    splitter = self.get_text_splitter_given_prompt(prompt, 1, padding=1)
-    return splitter.split_text(merged)

package-lock.json ADDED Viewed

The diff for this file is too large to render. See raw diff

package.json ADDED Viewed

	@@ -0,0 +1,26 @@

+{
+  "name": "google-clone-nextjs13",
+  "version": "0.1.0",
+  "private": true,
+  "scripts": {
+    "dev": "next dev",
+    "build": "next build",
+    "start": "next start",
+    "lint": "next lint"
+  },
+  "dependencies": {
+    "@next/font": "13.1.6",
+    "eslint": "8.34.0",
+    "eslint-config-next": "13.1.6",
+    "html-react-parser": "^3.0.9",
+    "next": "13.1.6",
+    "react": "18.2.0",
+    "react-dom": "18.2.0",
+    "react-icons": "^4.7.1"
+  },
+  "devDependencies": {
+    "autoprefixer": "^10.4.13",
+    "postcss": "^8.4.21",
+    "tailwindcss": "^3.2.7"
+  }
+}

postcss.config.js ADDED Viewed

	@@ -0,0 +1,6 @@

+// PostCSS plugins, each with its default options: Tailwind CSS and Autoprefixer.
+const plugins = {
+  tailwindcss: {},
+  autoprefixer: {},
+};
+module.exports = { plugins };

presets.py DELETED Viewed

@@ -1,29 +0,0 @@
-# Question-answering prompt templates, keyed by preset name.
-# Each template is formatted with two placeholders: {context_str} (the
-# retrieved context) and {query_str} (the user's question).
-prompt_tmpl_dict = {
-"Default":
-"""\
-Context information is below.
----------------------
-{context_str}
----------------------
-Using the provided context information, write a comprehensive reply to the given query.
-Make sure to cite results using [number] notation after the reference.
-If the provided context information refer to multiple subjects with the same name, write separate answers for each subject.
-Use prior knowledge only if the given context didn't provide enough information.
-Answer the question: {query_str}
-"""
-}
-# Answer-refinement prompt templates, keyed by preset name.
-# Each template is formatted with {query_str} (the question),
-# {existing_answer} (the answer so far) and {context_msg} (additional context).
-refine_tmpl_dict = {
-"Default":
-"""\
-The original question is as follows: {query_str}
-We have provided an existing answer: {existing_answer}
-We have the opportunity to refine the existing answer
-(only if needed) with some more context below.
-------------
-{context_msg}
-------------
-Given the new context, refine the original answer to better answer the question.
-If the context isn't useful, return the original answer.
-"""
-}

public/favicon.svg ADDED Viewed

public/spinner.svg ADDED Viewed

requirements.txt DELETED Viewed

@@ -1,10 +0,0 @@
-gradio
-llama_index
-langchain
-googlesearch-python
-llama-cpp-python
-IPython
-transformers
-sentence-transformers
---extra-index-url https://download.pytorch.org/whl/cu113
-torch

src/app/globals.css ADDED Viewed

	@@ -0,0 +1,17 @@

+@tailwind base;
+@tailwind components;
+@tailwind utilities;
+/* Reusable component classes composed from Tailwind utilities. */
+@layer components {
+  /* Light grey button. */
+  .btn {
+    @apply bg-[#f8f9fa] rounded-md text-sm text-gray-800 hover:ring-1 hover:ring-gray-200 focus:outline-none active:ring-gray-300 hover:shadow-md w-36 h-10 transition-shadow;
+  }
+
+  /* Text that underlines on hover. */
+  .link {
+    @apply hover:underline cursor-pointer;
+  }
+
+  /* Round icon button with a grey hover background. */
+  .header-icon {
+    @apply bg-transparent hover:bg-gray-200 p-2 text-4xl rounded-full cursor-pointer;
+  }
+}

src/app/head.jsx ADDED Viewed

	@@ -0,0 +1,10 @@

+// <head> contents: page title, viewport, description and favicon.
+const PAGE_TITLE = "Google Clone Next js 13";
+const PAGE_DESCRIPTION = "Google clone created by Next js 13";
+export default function Head() {
+  return (
+    <>
+      <title>{PAGE_TITLE}</title>
+      <meta content="width=device-width, initial-scale=1" name="viewport" />
+      <meta name="description" content={PAGE_DESCRIPTION} />
+      <link rel="icon" href="/favicon.svg" />
+    </>
+  );
+}

src/app/layout.jsx ADDED Viewed

	@@ -0,0 +1,19 @@

+import Footer from "@/components/Footer";
+import "./globals.css";
+// Root layout: renders the page content inside <html>/<body>, followed by the shared footer.
+export default function RootLayout(props) {
+  const { children } = props;
+  return (
+    <html lang="en">
+      {/*
+        <head /> will contain the components returned by the nearest parent
+        head.js. Find out more at https://beta.nextjs.org/docs/api-reference/file-conventions/head
+      */}
+      <body className="relative min-h-screen">
+        {children}
+        <Footer />
+      </body>
+    </html>
+  );
+}

src/app/page.jsx ADDED Viewed

	@@ -0,0 +1,24 @@

+import HomeHeader from "@/components/HomeHeader";
+import HomeSearch from "@/components/HomeSearch";
+import Image from "next/image";
+// Home page: header, centred logo and the search form.
+export default function Home() {
+  return (
+    <>
+      {/* Header */}
+      <HomeHeader />
+      {/* body */}
+      <div className="flex flex-col items-center mt-24">
+        {/* alt text added: the image previously had none for assistive technology */}
+        <Image
+          width="300"
+          height="100"
+          alt="Google logo"
+          src="https://upload.wikimedia.org/wikinews/en/archive/0/0c/20050620003808%21Google_logo_png.png"
+        />
+        <HomeSearch/>
+      </div>
+    </>
+  );
+}

src/app/search/error.jsx ADDED Viewed

	@@ -0,0 +1,15 @@

+"use client";
+import { useEffect } from "react";
+// Error UI: logs the received error and offers a retry button that calls `reset`.
+export default function Error({ error, reset }) {
+  // Log again whenever a different error object is received.
+  useEffect(() => {
+    console.log("Error: ", error);
+  }, [error]);
+  const handleRetry = () => reset();
+  return (
+    <div className="flex flex-col justify-center items-center pt-10">
+      <h1 className="text-3xl mb-4">Something went wrong</h1>
+      <button className="text-blue-500" onClick={handleRetry}>
+        Try again
+      </button>
+    </div>
+  );
+}

src/app/search/image/loading.jsx ADDED Viewed

	@@ -0,0 +1,23 @@

+// One pulsing placeholder card: a square thumbnail with two caption bars.
+function SkeletonCard() {
+  return (
+    <div className="animate-pulse">
+      <div className="h-48 w-48 mb-4 bg-gray-200 rounded-md"></div>
+      <div className="h-2 w-48 mb-2.5 bg-gray-200 rounded-md"></div>
+      <div className="h-2 w-44 mb-2.5 bg-gray-200 rounded-md"></div>
+    </div>
+  );
+}
+// Loading skeleton for image results: one card always, two more from the `sm` breakpoint up.
+// NOTE(review): `pb-42` is not in Tailwind's default spacing scale - confirm it is intended.
+export default function loading() {
+  return (
+    <div className="pt-10 mx-2 lg:pl-52 max-w-6xl flex sm:space-x-4 flex-col sm:flex-row pb-42">
+      <SkeletonCard />
+      <div className="hidden sm:inline-flex sm:space-x-4">
+        <SkeletonCard />
+        <SkeletonCard />
+      </div>
+    </div>
+  );
+}

src/app/search/image/page.jsx ADDED Viewed

	@@ -0,0 +1,36 @@

+export const dynamic = "force-dynamic";
+import ImageSearchResults from "@/components/ImageSearchResults";
+import Link from "next/link";
+// Server component: runs an image search through the Google Custom Search API
+// for `searchParams.searchTerm`, starting at result `searchParams.start` (default "1").
+// Throws when the API responds with a non-OK status.
+export default async function ImageSearchPage({ searchParams }) {
+  const startIndex = searchParams.start || "1";
+  // NOTE(review): fixed 2 s delay, presumably to show the loading skeleton - confirm it is still wanted.
+  await new Promise((resolve) => setTimeout(resolve, 2000));
+  // Encode user input so spaces, "&", "#" etc. cannot corrupt the query string.
+  // The original template also appended a stray "}" to every search term.
+  const searchTerm = encodeURIComponent(searchParams.searchTerm || "");
+  const start = encodeURIComponent(startIndex);
+  const response = await fetch(
+    `https://www.googleapis.com/customsearch/v1?key=${process.env.API_KEY}&cx=${process.env.CONTEXT_KEY}&q=${searchTerm}&searchType=image&start=${start}`
+  );
+  if (!response.ok) {
+    console.log(response);
+    throw new Error("Something went wrong");
+  }
+  const data = await response.json();
+  const results = data.items;
+  if (!results) {
+    return (
+      <div className="flex flex-col justify-center items-center pt-10">
+        <h1 className="text-3xl mb-4">No results found</h1>
+        <p className="text-lg">
+          Try searching for something else or go back to the homepage{" "}
+          <Link href="/" className="text-blue-500">
+            Home
+          </Link>
+        </p>
+      </div>
+    );
+  }
+  return <>{results && <ImageSearchResults results={data} />}</>;
+}

src/app/search/layout.jsx ADDED Viewed

	@@ -0,0 +1,12 @@

+import SearchHeader from "@/components/SearchHeader";
+import "./../globals.css";
+// Layout that places the search header above its child content.
+export default function SearchLayout(props) {
+  const { children } = props;
+  return (
+    <div>
+      <SearchHeader />
+      {children}
+    </div>
+  );
+}

src/app/search/web/loading.jsx ADDED Viewed

	@@ -0,0 +1,24 @@

+// One pulsing placeholder for a web result: four bars of different widths.
+function SkeletonResult() {
+  return (
+    <div className="mx-2 pt-10 max-w-6xl lg:pl-52 animate-pulse">
+      <div className="h-2.5 w-48 bg-gray-200 rounded-full mb-2.5"></div>
+      <div className="h-3.5 max-w-[360px] bg-gray-200 rounded-full mb-2.5"></div>
+      <div className="h-2 max-w-[560px] bg-gray-200 rounded-full mb-2.5"></div>
+      <div className="h-2 max-w-[530px] bg-gray-200 rounded-full mb-2.5"></div>
+    </div>
+  );
+}
+// Loading skeleton for web results: three identical placeholders.
+export default function loading() {
+  return (
+    <>
+      <SkeletonResult />
+      <SkeletonResult />
+      <SkeletonResult />
+    </>
+  );
+}

src/app/search/web/page.jsx ADDED Viewed

	@@ -0,0 +1,36 @@

+export const dynamic = "force-dynamic";
+import WebSearchResults from "@/components/WebSearchResults";
+import Link from "next/link";
+// Server component: runs a web search through the Google Custom Search API
+// for `searchParams.searchTerm`, starting at result `searchParams.start` (default "1").
+// Throws when the API responds with a non-OK status.
+export default async function WebSearchPage({ searchParams }) {
+  const startIndex = searchParams.start || "1";
+  // NOTE(review): fixed 2 s delay, presumably to show the loading skeleton - confirm it is still wanted.
+  await new Promise((resolve) => setTimeout(resolve, 2000));
+  // Encode user input so spaces, "&", "#" etc. cannot corrupt the query string.
+  // The original template also appended a stray "}" to every search term.
+  const searchTerm = encodeURIComponent(searchParams.searchTerm || "");
+  const start = encodeURIComponent(startIndex);
+  const response = await fetch(
+    `https://www.googleapis.com/customsearch/v1?key=${process.env.API_KEY}&cx=${process.env.CONTEXT_KEY}&q=${searchTerm}&start=${start}`
+  );
+  if (!response.ok) {
+    console.log(response);
+    throw new Error("Something went wrong");
+  }
+  const data = await response.json();
+  const results = data.items;
+  if (!results) {
+    return (
+      <div className="flex flex-col justify-center items-center pt-10">
+        <h1 className="text-3xl mb-4">No results found</h1>
+        <p className="text-lg">
+          Try searching for something else or go back to the homepage{" "}
+          <Link href="/" className="text-blue-500">
+            Home
+          </Link>
+        </p>
+      </div>
+    );
+  }
+  return <>{results && <WebSearchResults results={data} />}</>;
+}

src/components/CountryLookup.jsx ADDED Viewed

	@@ -0,0 +1,15 @@

+"use client";
+import { useEffect, useState } from "react";
+export default function CountryLookup() {
+  const [country, setCountry] = useState("United States");
+  useEffect(() => {
+    fetch(
+      `https://extreme-ip-lookup.com/json/?key=${process.env.NEXT_PUBLIC_IP_API_KEY}`
+    )
+      .then((res) => res.json())
+      .then((data) => setCountry(data.country));
+  }, []);
+  return <div>{country}</div>;
+}

src/components/Footer.jsx ADDED Viewed

	@@ -0,0 +1,9 @@

+import CountryLookup from "./CountryLookup";
+/**
+ * Page footer: an empty, full-width bar pinned to the bottom of its
+ * positioned ancestor.
+ *
+ * NOTE(review): CountryLookup is imported above but not rendered here.
+ */
+export default function Footer() {
+  return (
+    <footer className="absolute bottom-0 text-sm text-gray-500 bg-[#f2f2f2] w-full">
+    </footer>
+  );
+}

src/components/HomeHeader.jsx ADDED Viewed

	@@ -0,0 +1,10 @@

+import Link from "next/link";
+import { TbGridDots } from "react-icons/tb";
+/**
+ * Header for the home page: currently an empty, right-aligned flex
+ * container with padding.
+ *
+ * NOTE(review): Link and TbGridDots are imported above but unused here.
+ */
+export default function HomeHeader() {
+  return (
+    <header className="flex justify-end p-5 text-sm">
+    </header>
+  );
+}

src/components/HomeSearch.jsx ADDED Viewed

	@@ -0,0 +1,62 @@

+"use client";
+import { useState } from "react";
+import { useRouter } from "next/navigation";
+import { AiOutlineSearch } from "react-icons/ai";
+import { BsFillMicFill } from "react-icons/bs";
+export default function HomeSearch() {
+  const router = useRouter();
+  const [input, setInput] = useState("");
+  const [randomSearchLoading, setRandomSearchLoading] = useState(false);
+  function handleSubmit(e) {
+    e.preventDefault();
+    if (!input.trim()) return;
+    router.push(`/search/web?searchTerm=${input}`);
+  }
+  async function randomSearch() {
+    setRandomSearchLoading(true);
+    const response = await fetch("https://random-word-api.herokuapp.com/word")
+      .then((res) => res.json())
+      .then((data) => data[0]);
+    if (!response) return;
+    router.push(`/search/web?searchTerm=${response}`);
+    setRandomSearchLoading(false);
+  }
+  return (
+    <>
+      <form
+        onSubmit={handleSubmit}
+        className="flex w-full mt-5 mx-auto max-w-[90%] border border-gray-200 px-5 py-3 rounded-full hover:shadow-md focus-within:shadow-md transition-shadow sm:max-w-xl lg:max-w-2xl"
+      >
+        <AiOutlineSearch className="text-xl text-gray-500 mr-3" />
+        <input
+          type="text"
+          className="flex-grow focus:outline-none"
+          onChange={(e) => setInput(e.target.value)}
+          value={input}
+        />
+      </form>
+      <div className="flex flex-col space-y-2 sm:space-y-0 sm:space-x-4 justify-center sm:flex-row mt-8 ">
+        <button onClick={handleSubmit} className="btn">
+          Google Search
+        </button>
+        <button
+          disabled={randomSearchLoading}
+          onClick={randomSearch}
+          className="btn flex items-center justify-center disabled:opacity-80"
+        >
+          {randomSearchLoading ? (
+            <img
+              src="spinner.svg"
+              alt="loading..."
+              className="h-6 text-center"
+            />
+          ) : (
+            "I'm feeling lucky"
+          )}
+        </button>
+      </div>
+    </>
+  );
+}

src/components/ImageSearchResults.jsx ADDED Viewed

	@@ -0,0 +1,37 @@

+import Link from "next/link";
+import PaginationButtons from "./PaginationButtons";
+export default function ImageSearchResults({ results }) {
+  return (
+    <div className="sm:pb-24 pb-40  mt-4">
+      <div className="grid grid-cols-1 sm:grid-cols-2 lg:grid-cols-3 xl:grid-cols-4 px-3 space-x-4">
+        {results.items.map((result) => (
+          <div key={result.link} className="mb-8">
+            <div className="group">
+              <Link href={result.image.contextLink}>
+                <img
+                  src={result.link}
+                  alt={result.title}
+                  className="h-60 group-hover:shadow-xl w-full object-contain transition-shadow"
+                />
+              </Link>
+              <Link href={result.image.contextLink}>
+                <h2 className="group-hover:underline truncate text-xl">
+                  {result.title}
+                </h2>
+              </Link>
+              <Link href={result.image.contextLink}>
+                <p className="group-hover:underline text-gray-600">
+                  {result.displayLink}
+                </p>
+              </Link>
+            </div>
+          </div>
+        ))}
+      </div>
+      <div className="ml-16">
+        <PaginationButtons />
+      </div>
+    </div>
+  );
+}

src/components/PaginationButtons.jsx ADDED Viewed

	@@ -0,0 +1,37 @@

+"use client";
+import Link from "next/link";
+import { usePathname, useSearchParams } from "next/navigation";
+import { BsChevronLeft, BsChevronRight } from "react-icons/bs";
+export default function PaginationButtons() {
+  const pathname = usePathname();
+  const searchParams = useSearchParams();
+  const searchTerm = searchParams.get("searchTerm");
+  const startIndex = +searchParams.get("start") || 1;
+  return (
+    <div className="text-blue-700 flex px-10 pb-4 justify-between sm:justify-start sm:space-x-44 sm:px-0">
+      {startIndex >= 10 && (
+        <Link
+          href={`${pathname}?searchTerm=${searchTerm}&start=${startIndex - 10}`}
+        >
+          <div className="flex flex-col cursor-pointer items-center hover:underline">
+            <BsChevronLeft className="h-5" />
+            <p>Previous</p>
+          </div>
+        </Link>
+      )}
+      {startIndex <= 90 && (
+        <Link
+          href={`${pathname}?searchTerm=${searchTerm}&start=${startIndex + 10}`}
+        >
+          <div className="flex flex-col cursor-pointer items-center hover:underline">
+            <BsChevronRight className="h-5" />
+            <p>Next</p>
+          </div>
+        </Link>
+      )}
+    </div>
+  );
+}

src/components/SearchBox.jsx ADDED Viewed

	@@ -0,0 +1,42 @@

+"use client";
+import { useSearchParams, useRouter } from "next/navigation";
+import { RxCross2 } from "react-icons/rx";
+import { BsFillMicFill } from "react-icons/bs";
+import { AiOutlineSearch } from "react-icons/ai";
+import { useState } from "react";
+export default function SearchBox() {
+  const searchParams = useSearchParams();
+  const router = useRouter();
+  const searchTerm = searchParams.get("searchTerm");
+  const [term, setTerm] = useState(searchTerm || "");
+  function handleSubmit(e) {
+    e.preventDefault();
+    if (!term.trim()) return;
+    router.push(`/search/web?searchTerm=${term}`);
+  }
+  return (
+    <form
+      className="flex border border-gray-200 rounded-full shadow-lg px-6 py-3 ml-10 mr-5 flex-grow max-w-3xl items-center"
+      onSubmit={handleSubmit}
+    >
+      <input
+        type="text"
+        className="w-full focus:outline-none"
+        value={term}
+        onChange={(e) => setTerm(e.target.value)}
+      />
+      <RxCross2
+        className="text-2xl text-gray-500 cursor-pointer sm:mr-2"
+        onClick={() => setTerm("")}
+      />
+      <BsFillMicFill className="hidden sm:inline-flex text-4xl text-blue-500 pl-4 border-l-2 border-gray-300 mr-3" />
+      <AiOutlineSearch
+        className="text-2xl hidden sm:inline-flex text-blue-500 cursor-pointer"
+        onClick={handleSubmit}
+      />
+    </form>
+  );
+}

src/components/SearchHeader.jsx ADDED Viewed

	@@ -0,0 +1,33 @@

+import Image from "next/image";
+import Link from "next/link";
+import SearchBox from "./SearchBox";
+import { RiSettings3Line } from "react-icons/ri";
+import { TbGridDots } from "react-icons/tb";
+import SearchHeaderOptions from "./SearchHeaderOptions";
+export default function SearchHeader() {
+  return (
+    <header className="sticky top-0 bg-white">
+      <div className="flex w-full p-6 items-center justify-between">
+        <Link href={"/"}>
+          <Image
+            width="120"
+            height="40"
+            src="https://upload.wikimedia.org/wikipedia/commons/thumb/2/2f/Google_2015_logo.svg/640px-Google_2015_logo.svg.png"
+          />
+        </Link>
+        <div className="flex-1">
+          <SearchBox />
+        </div>
+        <div className="hidden md:inline-flex space-x-2 ">
+          <RiSettings3Line className="header-icon" />
+          <TbGridDots className="header-icon" />
+        </div>
+        <button className="bg-blue-500 text-white px-6 py-2 font-medium rounded-md hover:brightness-105 hover:shadow-md transition-all ml-2">
+          Sign in
+        </button>
+      </div>
+      <SearchHeaderOptions />
+    </header>
+  );
+}

src/components/SearchHeaderOptions.jsx ADDED Viewed

	@@ -0,0 +1,25 @@

+"use client"
+import { AiOutlineCamera, AiOutlineSearch } from "react-icons/ai";
+import { usePathname, useRouter, useSearchParams } from "next/navigation";
+export default function SearchHeaderOptions() {
+  const pathname = usePathname();
+  const router = useRouter();
+  const searchParams = useSearchParams();
+  const searchTerm = searchParams.get("searchTerm");
+  function selectTab(tab) {
+    router.push(`/search/${tab === "Images" ? "image" : "web"}?searchTerm=${searchTerm}`);
+  }
+  return (
+    <div className="flex space-x-2 select-none border-b w-full justify-center lg:justify-start lg:pl-52 text-gray-700 text-sm">
+      <div onClick={()=>selectTab("All")} className={`flex items-center space-x-1 border-b-4 border-transparent active:text-blue-500 cursor-pointer pb-3 px-2 ${pathname === "/search/web" && "!text-blue-600 !border-blue-600"}`}>
+        <AiOutlineSearch className="text-md"/>
+        <p>All</p>
+      </div>
+      <div onClick={()=>selectTab("Images")} className={`flex items-center space-x-1 border-b-4 border-transparent active:text-blue-500 cursor-pointer pb-3 px-2 ${pathname === "/search/image" && "!text-blue-600 !border-blue-600"}`}>
+        <AiOutlineCamera className="text-md"/>
+        <p>Images</p>
+      </div>
+    </div>
+  )
+}

src/components/WebSearchResults.jsx ADDED Viewed

	@@ -0,0 +1,31 @@

+import Link from "next/link";
+import Parser from "html-react-parser";
+import PaginationButtons from "./PaginationButtons";
+export default function WebSearchResults({ results }) {
+  return (
+    <div className="w-full mx-auto px-3 pb-40 sm:pb-24 sm:pl-[5%] md:pl-[14%] lg:pl-52">
+      <p className="text-gray-600 text-sm mb-5 mt-3">
+        About {results.searchInformation?.formattedTotalResults} results (
+        {results.searchInformation?.formattedSearchTime} seconds)
+      </p>
+      {results.items?.map((result) => (
+        <div className="mb-8 max-w-xl" key={result.link}>
+          <div className="group flex flex-col">
+            <Link className="text-sm truncate" href={result.link}>
+              {result.formattedUrl}
+            </Link>
+            <Link
+              className="group-hover:underline decoration-blue-800 text-xl truncate font-medium text-blue-800"
+              href={result.link}
+            >
+              {result.title}
+            </Link>
+          </div>
+          <p className="text-gray-600">{Parser(result.htmlSnippet)}</p>
+        </div>
+      ))}
+      <PaginationButtons />
+    </div>
+  );
+}

tailwind.config.js ADDED Viewed

	@@ -0,0 +1,15 @@

+// Tailwind CSS configuration: lists the files scanned for class names and
+// leaves the theme and plugin list at their defaults.
+/** @type {import('tailwindcss').Config} */
+module.exports = {
+  // Globs of source files to scan for class names.
+  content: [
+    "./app/**/*.{js,ts,jsx,tsx}",
+    "./pages/**/*.{js,ts,jsx,tsx}",
+    "./components/**/*.{js,ts,jsx,tsx}",
+    // Or if using `src` directory:
+    "./src/**/*.{js,ts,jsx,tsx}",
+  ],
+  theme: {
+    // No theme customizations.
+    extend: {},
+  },
+  plugins: [],
+}

utils.py DELETED Viewed

@@ -1,57 +0,0 @@
-import os
-import gradio as gr
-from zipfile import ZipFile
-from presets import *
-def refresh_json_list(plain=False):
-    json_list = []
-    for root, dirs, files in os.walk("./index"):
-        for file in files:
-            if os.path.splitext(file)[1] == '.json':
-                json_list.append(os.path.splitext(file)[0])
-    if plain:
-        return json_list
-    return gr.Dropdown.update(choices=json_list)
-def upload_file(file_obj):
-    files = []
-    with ZipFile(file_obj.name) as zfile:
-        for zinfo in zfile.infolist():
-            files.append(
-                {
-                    "name": zinfo.filename,
-                }
-            )
-    return files
-def reset_textbox():
-    return gr.update(value='')
-def change_prompt_tmpl(tmpl_select):
-    new_tmpl = prompt_tmpl_dict[tmpl_select]
-    return gr.update(value=new_tmpl)
-def change_refine_tmpl(refine_select):
-    new_tmpl = refine_tmpl_dict[refine_select]
-    return gr.update(value=new_tmpl)
-def lock_params(index_type):
-    if index_type == "GPTVectorStoreIndex" or index_type == "GPTListIndex":
-        return gr.Slider.update(interactive=False, label="子节点数量（当前索引类型不可用）"), gr.Slider.update(interactive=False, label="每段关键词数量（当前索引类型不可用）")
-    elif index_type == "GPTTreeIndex":
-        return gr.Slider.update(interactive=True, label="子节点数量"), gr.Slider.update(interactive=False, label="每段关键词数量（当前索引类型不可用）")
-    elif index_type == "GPTKeywordTableIndex":
-        return gr.Slider.update(interactive=False, label="子节点数量（当前索引类型不可用）"), gr.Slider.update(interactive=True, label="每段关键词数量")
-def add_space(text):
-    punctuations = {'，': '， ', '。': '。 ', '？': '？ ', '！': '！ ', '：': '： ', '；': '； '}
-    for cn_punc, en_punc in punctuations.items():
-        text = text.replace(cn_punc, en_punc)
-    return text
-## create a test for parse_text
-def parse_text(text):
-    lines = text.split("\n")
-    lines = [line for line in lines if line != ""]
-    text = "".join(lines)
-    return text