1 jaar geleden · 1aecd00924
--- a/README.md
+++ b/README.md
@@ -2,6 +2,9 @@
 
				 
			
 
				 The 'llama-recipes' repository is a companion to the [Llama 2 model](https://github.com/facebookresearch/llama). The goal of this repository is to provide examples to quickly get started with fine-tuning for domain adaptation and how to run inference for the fine-tuned models. For ease of use, the examples use Hugging Face converted versions of the models. See steps for conversion of the model [here](#model-conversion-to-hugging-face).
			
 
				 
			
 
				+In addition, we also provide a number of demo apps, to showcase the Llama2 usage along with other ecosystem solutions to run Llama2 locally on your mac and on cloud.
			
 
				+
			
 
				+
			
 
				 Llama 2 is a new technology that carries potential risks with use. Testing conducted to date has not — and could not — cover all scenarios. In order to help developers address these risks, we have created the [Responsible Use Guide](https://github.com/facebookresearch/llama/blob/main/Responsible-Use-Guide.pdf). More details can be found in our research paper as well. For downloading the models, follow the instructions on [Llama 2 repo](https://github.com/facebookresearch/llama).
			
 
				 
			
 
				 
			
@@ -13,8 +16,9 @@ Llama 2 is a new technology that carries potential risks with use. Testing condu
 
				     - [Multi GPU One Node](#multiple-gpus-one-node)
			
 
				     - [Multi GPU Multi Node](#multi-gpu-multi-node)
			
 
				 4. [Inference](./docs/inference.md)
			
 
				-5. [Repository Organization](#repository-organization)
			
 
				-6. [License and Acceptable Use Policy](#license)
			
 
				+5. [Demo Apps](#demo-apps)
			
 
				+6. [Repository Organization](#repository-organization)
			
 
				+7. [License and Acceptable Use Policy](#license)
			
 
				 
			
 
				 
			
 
				 
			
@@ -174,6 +178,17 @@ sbatch multi_node.slurm
 
				 ```
			
 
				 You can read more about our fine-tuning strategies [here](./docs/LLM_finetuning.md).
			
 
				 
			
 
				+# Demo Apps
			
 
				+This folder contains a series of Llama2-powered apps:
			
 
				+* Quickstart Llama deployments and basic interactions with Llama
			
 
				+1. Llama on your Mac and ask Llama general questions
			
 
				+2. Llama on Google Colab
			
 
				+3. Llama on Cloud and ask Llama questions about unstructured data in a PDF
			
 
				+
			
 
				+* Specialized Llama use cases:
			
 
				+1. Ask Llama to summarize a video content
			
 
				+2. Ask Llama questions about structured data in a DB
			
 
				+3. Ask Llama questions about live data on the web
			
 
				 
			
 
				 # Repository Organization
			
 
				 This repository is organized in the following way:
			
@@ -184,6 +199,8 @@ This repository is organized in the following way:
 
				 
			
 
				 [datasets](src/llama_recipes/datasets/): Contains individual scripts for each dataset to download and process. Note: Use of any of the datasets should be in compliance with the dataset's underlying licenses (including but not limited to non-commercial uses)
			
 
				 
			
 
				+[demo_apps](./demo_apps) contains a series of Llama2-powered apps, from quickstart deployments to how to ask Llama questions about unstructured data, structured data, live data, and video summary.
			
 
				+
			
 
				 [examples](./examples/): Contains examples script for finetuning and inference of the Llama 2 model as well as how to use them safely.
			
 
				 
			
 
				 [inference](src/llama_recipes/inference/): Includes modules for inference for the fine-tuned models.
			
--- a/demo_apps/HelloLlamaCloud.ipynb
+++ b/demo_apps/HelloLlamaCloud.ipynb
--- a/demo_apps/HelloLlamaLocal.ipynb
+++ b/demo_apps/HelloLlamaLocal.ipynb
--- a/demo_apps/LiveData.ipynb
+++ b/demo_apps/LiveData.ipynb
--- a/demo_apps/Llama2_Gradio.ipynb
+++ b/demo_apps/Llama2_Gradio.ipynb
@@ -0,0 +1,96 @@
 
				+{
			
 
				+ "cells": [
			
 
				+  {
			
 
				+   "cell_type": "code",
			
 
				+   "execution_count": 1,
			
 
				+   "id": "928041cc",
			
 
				+   "metadata": {},
			
 
				+   "outputs": [
			
 
				+    {
			
 
				+     "name": "stderr",
			
 
				+     "output_type": "stream",
			
 
				+     "text": [
			
 
				+      "Init param `input` is deprecated, please use `model_kwargs` instead.\n"
			
 
				+     ]
			
 
				+    },
			
 
				+    {
			
 
				+     "name": "stdout",
			
 
				+     "output_type": "stream",
			
 
				+     "text": [
			
 
				+      "Running on local URL:  http://127.0.0.1:7860\n",
			
 
				+      "\n",
			
 
				+      "To create a public link, set `share=True` in `launch()`.\n"
			
 
				+     ]
			
 
				+    },
			
 
				+    {
			
 
				+     "data": {
			
 
				+      "text/html": [
			
 
				+       "<div><iframe src=\"http://127.0.0.1:7860/\" width=\"100%\" height=\"500\" allow=\"autoplay; camera; microphone; clipboard-read; clipboard-write;\" frameborder=\"0\" allowfullscreen></iframe></div>"
			
 
				+      ],
			
 
				+      "text/plain": [
			
 
				+       "<IPython.core.display.HTML object>"
			
 
				+      ]
			
 
				+     },
			
 
				+     "metadata": {},
			
 
				+     "output_type": "display_data"
			
 
				+    },
			
 
				+    {
			
 
				+     "data": {
			
 
				+      "text/plain": []
			
 
				+     },
			
 
				+     "execution_count": 1,
			
 
				+     "metadata": {},
			
 
				+     "output_type": "execute_result"
			
 
				+    }
			
 
				+   ],
			
 
				+   "source": [
			
 
				+    "from langchain.schema import AIMessage, HumanMessage\n",
			
 
				+    "import gradio as gr\n",
			
 
				+    "from langchain.llms import Replicate\n",
			
 
				+    "import os\n",
			
 
				+    "\n",
			
 
				+    "os.environ[\"REPLICATE_API_TOKEN\"] = \"<your replicate api token>\"\n",
			
 
				+    "\n",
			
 
				+    "llama2_13b_chat = \"meta/llama-2-13b-chat:f4e2de70d66816a838a89eeeb621910adffb0dd0baba3976c96980970978018d\"\n",
			
 
				+    "\n",
			
 
				+    "llm = Replicate(\n",
			
 
				+    "    model=llama2_13b_chat,\n",
			
 
				+    "    model_kwargs={\"temperature\": 0.01, \"top_p\": 1, \"max_new_tokens\":500}\n",
			
 
				+    ")\n",
			
 
				+    "\n",
			
 
				+    "\n",
			
 
				+    "def predict(message, history):\n",
			
 
				+    "    history_langchain_format = []\n",
			
 
				+    "    for human, ai in history:\n",
			
 
				+    "        history_langchain_format.append(HumanMessage(content=human))\n",
			
 
				+    "        history_langchain_format.append(AIMessage(content=ai))\n",
			
 
				+    "    history_langchain_format.append(HumanMessage(content=message))\n",
			
 
				+    "    gpt_response = llm(message) #history_langchain_format)\n",
			
 
				+    "    return gpt_response#.content\n",
			
 
				+    "\n",
			
 
				+    "gr.ChatInterface(predict).launch()"
			
 
				+   ]
			
 
				+  }
			
 
				+ ],
			
 
				+ "metadata": {
			
 
				+  "kernelspec": {
			
 
				+   "display_name": "Python 3 (ipykernel)",
			
 
				+   "language": "python",
			
 
				+   "name": "python3"
			
 
				+  },
			
 
				+  "language_info": {
			
 
				+   "codemirror_mode": {
			
 
				+    "name": "ipython",
			
 
				+    "version": 3
			
 
				+   },
			
 
				+   "file_extension": ".py",
			
 
				+   "mimetype": "text/x-python",
			
 
				+   "name": "python",
			
 
				+   "nbconvert_exporter": "python",
			
 
				+   "pygments_lexer": "ipython3",
			
 
				+   "version": "3.8.18"
			
 
				+  }
			
 
				+ },
			
 
				+ "nbformat": 4,
			
 
				+ "nbformat_minor": 5
			
 
				+}
			
--- a/demo_apps/README.md
+++ b/demo_apps/README.md
--- a/demo_apps/StructuredLlama.ipynb
+++ b/demo_apps/StructuredLlama.ipynb
--- a/demo_apps/VideoSummary.ipynb
+++ b/demo_apps/VideoSummary.ipynb
--- a/demo_apps/csv2db.py
+++ b/demo_apps/csv2db.py
@@ -0,0 +1,38 @@
 
				+import sqlite3
			
 
				+import csv
			
 
				+
			
 
				+# Define the input CSV file and the SQLite database file
			
 
				+input_csv = 'nba_roster.csv'
			
 
				+database_file = 'nba_roster.db'
			
 
				+
			
 
				+# Connect to the SQLite database
			
 
				+conn = sqlite3.connect(database_file)
			
 
				+cursor = conn.cursor()
			
 
				+
			
 
				+# Create a table to store the data
			
 
				+cursor.execute('''CREATE TABLE IF NOT EXISTS nba_roster (
			
 
				+                    Team TEXT,
			
 
				+                    NAME TEXT,
			
 
				+                    Jersey TEXT,
			
 
				+                    POS TEXT,
			
 
				+                    AGE INT,
			
 
				+                    HT TEXT,
			
 
				+                    WT TEXT,
			
 
				+                    COLLEGE TEXT,
			
 
				+                    SALARY TEXT
			
 
				+                )''')
			
 
				+
			
 
				+# Read data from the CSV file and insert it into the SQLite table
			
 
				+with open(input_csv, 'r', newline='') as csvfile:
			
 
				+    csv_reader = csv.reader(csvfile)
			
 
				+    next(csv_reader)  # Skip the header row
			
 
				+    
			
 
				+    for row in csv_reader:
			
 
				+        cursor.execute('INSERT INTO nba_roster VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?)', row)
			
 
				+
			
 
				+# Commit the changes and close the database connection
			
 
				+conn.commit()
			
 
				+conn.close()
			
 
				+
			
 
				+print(f'Data from {input_csv} has been successfully imported into {database_file}')
			
 
				+
			
--- a/demo_apps/llama2-gradio.png
+++ b/demo_apps/llama2-gradio.png
--- a/demo_apps/llama2-streamlit.png
+++ b/demo_apps/llama2-streamlit.png
--- a/demo_apps/llama2-streamlit2.png
+++ b/demo_apps/llama2-streamlit2.png
--- a/demo_apps/llama2.pdf
+++ b/demo_apps/llama2.pdf
--- a/demo_apps/nba.txt
+++ b/demo_apps/nba.txt
--- a/demo_apps/streamlit_llama2.py
+++ b/demo_apps/streamlit_llama2.py
@@ -0,0 +1,22 @@
 
				+import streamlit as st
			
 
				+from langchain.llms import Replicate
			
 
				+import os
			
 
				+
			
 
				+st.title("Llama2-powered Streamlit App")
			
 
				+
			
 
				+with st.sidebar:
			
 
				+    os.environ["REPLICATE_API_TOKEN"] = "<your replicate api token>"
			
 
				+
			
 
				+def generate_response(input_text):
			
 
				+    llama2_13b_chat = "meta/llama-2-13b-chat:f4e2de70d66816a838a89eeeb621910adffb0dd0baba3976c96980970978018d"
			
 
				+
			
 
				+    llm = Replicate(
			
 
				+        model=llama2_13b_chat,
			
 
				+        model_kwargs={"temperature": 0.01, "top_p": 1, "max_new_tokens":500}
			
 
				+    )
			
 
				+    st.info(llm(input_text))
			
 
				+
			
 
				+with st.form("my_form"):
			
 
				+    text = st.text_area("Enter text:", "What is Generative AI?")
			
 
				+    submitted = st.form_submit_button("Submit")
			
 
				+    generate_response(text)
			
--- a/demo_apps/txt2csv.py
+++ b/demo_apps/txt2csv.py
@@ -0,0 +1,53 @@
 
				+import csv
			
 
				+
			
 
				+# Define the input and output file names
			
 
				+input_file = 'nba.txt'
			
 
				+output_file = 'nba_roster.csv'
			
 
				+
			
 
				+# Initialize lists to store data
			
 
				+roster_data = []
			
 
				+current_team = None
			
 
				+
			
 
				+# Open the input file
			
 
				+with open(input_file, 'r') as file:
			
 
				+    for line in file:
			
 
				+        # Remove leading and trailing whitespaces from the line
			
 
				+        line = line.strip()
			
 
				+        
			
 
				+        # Check if the line starts with 'https', skip it
			
 
				+        if line.startswith('https'):
			
 
				+            continue
			
 
				+        
			
 
				+        # Check if the line contains the team name
			
 
				+        if 'Roster' in line:
			
 
				+            current_team = line.split(' Roster ')[0]
			
 
				+        elif line and "NAME" not in line:  # Skip empty lines and header lines
			
 
				+            # Split the line using tabs as the delimiter
			
 
				+            player_info = line.split('\t')
			
 
				+            
			
 
				+            # Remove any numbers from the player's name and set Jersey accordingly
			
 
				+            name = ''.join([c for c in player_info[0] if not c.isdigit()])
			
 
				+            jersey = ''.join([c for c in player_info[0] if c.isdigit()])
			
 
				+            
			
 
				+            # If no number found, set Jersey to "NA"
			
 
				+            if not jersey:
			
 
				+                jersey = "NA"
			
 
				+            
			
 
				+            # Append the team name, name, and jersey to the player's data
			
 
				+            player_info = [current_team, name, jersey] + player_info[1:]
			
 
				+            
			
 
				+            # Append the player's data to the roster_data list
			
 
				+            roster_data.append(player_info)
			
 
				+
			
 
				+# Write the data to a CSV file
			
 
				+with open(output_file, 'w', newline='') as csvfile:
			
 
				+    writer = csv.writer(csvfile)
			
 
				+    
			
 
				+    # Write the header row
			
 
				+    writer.writerow(['Team', 'NAME', 'Jersey', 'POS', 'AGE', 'HT', 'WT', 'COLLEGE', 'SALARY'])
			
 
				+    
			
 
				+    # Write the player data
			
 
				+    writer.writerows(roster_data)
			
 
				+
			
 
				+print(f'Conversion completed. Data saved to {output_file}')
			
 
				+
			
--- a/scripts/spellcheck_conf/wordlist.txt
+++ b/scripts/spellcheck_conf/wordlist.txt
@@ -1156,4 +1156,30 @@ Autocast
 
				 FN
			
 
				 GBs
			
 
				 MLP
			
 
				-learnable
			
 
				+learnable
			
 
				+Colab
			
 
				+GenAI
			
 
				+Gradio
			
 
				+HelloLlama
			
 
				+HelloLlamaCloud
			
 
				+HelloLlamaLocal
			
 
				+LLM's
			
 
				+LangChain
			
 
				+LangChain's
			
 
				+LiveData
			
 
				+LlamaIndex
			
 
				+MBP
			
 
				+MLC
			
 
				+Replicate's
			
 
				+StructuredLlama
			
 
				+VideoSummary
			
 
				+cpp
			
 
				+envinronment
			
 
				+ggml
			
 
				+gguf
			
 
				+gradio
			
 
				+minnutes
			
 
				+pdf
			
 
				+quantized
			
 
				+serarch
			
 
				+streamlit