--- LLM

!pip install -q -U transformers peft accelerate optimum bitsandbytes !pip install -q -U huggingface_hub !huggingface-cli login

from transformers import AutoModelForCausalLM, AutoTokenizer, GenerationConfig, TextStreamer

name = 'microsoft/phi-2'

model=AutoModelForCausalLM.from_pretrained(name, low_cpu_mem_usage=True, load_in_8bit=True) tokenizer=AutoTokenizer.from_pretrained(name) tokenizer.pad_token_id=tokenizer.eos_token_id

generation_config=GenerationConfig(max_new_tokens=500, temperature=0.4, top_p=0.95, top_k=40, repetition_penalty=1.2, bos_token_id=tokenizer.bos_token_id, eos_token_id=tokenizer.eos_token_id, do_sample=True, use_cache=True, output_attentions=False, output_hidden_states=False, output_scores=False, remove_invalid_values=True ) streamer = TextStreamer(tokenizer)

def ask_model(instruction, system='Du bist ein hilfreicher Assistent.'): prompt=f"{system} USER: {instruction} ASSISTANT:" input_tokens=tokenizer(prompt, return_tensors="pt").to(model.device) output_tokens=model.generate(**input_tokens, generation_config=generation_config, streamer=streamer)[0] answer=tokenizer.decode(output_tokens, skip_special_tokens=True) return answer

answer=ask_model('Wenn du 2024 als Bundeskanzler kandidieren würdest, was wäre dein Wahlprogramm?')

Example for Factual/Retrieval with less Hallucinations

Please use the Format and system message below for Factual retrieval. The model is trained to only answer from provided context and not hallucinate any answers or additional information.

retrieval_system="Du bist ein hilfreicher Assistent. Für die folgende Aufgabe stehen dir zwischen den tags BEGININPUT und ENDINPUT mehrere Quellen zur Verfügung. Metadaten zu den einzelnen Quellen wie Autor, URL o.ä. sind zwischen BEGINCONTEXT und ENDCONTEXT zu finden, danach folgt der Text der Quelle. Die eigentliche Aufgabe oder Frage ist zwischen BEGININSTRUCTION und ENDINCSTRUCTION zu finden. Beantworte diese wortwörtlich mit einem Zitat aus den Quellen. Sollten diese keine Antwort enthalten, antworte, dass auf Basis der gegebenen Informationen keine Antwort möglich ist!" retrieval_question="""
BEGININPUT BEGINCONTEXT Url: https://www.jph.me ENDCONTEXT Das Wetter in Düsseldorf wird heute schön und sonnig! ENDINPUT BEGININSTRUCTION Was ist 1+1? ENDINSTRUCTION""" ask_model(retrieval_question, system=retrieval_system)

retrieval_system="Du bist ein hilfreicher Assistent. Für die folgende Aufgabe stehen dir zwischen den tags BEGININPUT und ENDINPUT mehrere Quellen zur Verfügung. Metadaten zu den einzelnen Quellen wie Autor, URL o.ä. sind zwischen BEGINCONTEXT und ENDCONTEXT zu finden, danach folgt der Text der Quelle. Die eigentliche Aufgabe oder Frage ist zwischen BEGININSTRUCTION und ENDINCSTRUCTION zu finden. Beantworte diese wortwörtlich mit einem Zitat aus den Quellen. Sollten diese keine Antwort enthalten, antworte, dass auf Basis der gegebenen Informationen keine Antwort möglich ist!" retrieval_question="""
BEGININPUT BEGINCONTEXT Url: https://www.jph.me ENDCONTEXT Das Wetter in Düsseldorf wird heute schön und sonnig! ENDINPUT BEGININSTRUCTION Wie wird das Wetter heute in Düsseldorf? ENDINSTRUCTION""" ask_model(retrieval_question, system=retrieval_system)

--- Q/A:

Tutorial: Build Your First Question Answering System

https://haystack.deepset.ai/tutorials/01_basic_qa_pipeline

Q&A Model:

https://huggingface.co/deepset/roberta-base-squad2

from transformers import AutoModelForQuestionAnswering, AutoTokenizer, pipeline

model_name = "deepset/roberta-base-squad2"

model_name = "timpal0l/mdeberta-v3-base-squad2"

a) Get predictions

nlp = pipeline('question-answering', model=model_name, tokenizer=model_name)

QA_input = { 'question': 'Was ist Wikipedia?', 'context': 'Wikipedia ist ein Projekt zum Aufbau einer Enzyklopädie aus freien Inhalten, zu denen du sehr gern beitragen kannst. Seit März 2001 sind 2.874.691 Artikel in deutscher Sprache entstanden.' } res = nlp(QA_input)

b) Load model & tokenizer

model = AutoModelForQuestionAnswering.from_pretrained(model_name) tokenizer = AutoTokenizer.from_pretrained(model_name)

res

--- ChromaDB

https://www.datacamp.com/tutorial/chromadb-tutorial-step-by-step-guide

import chromadb

from numpy.distutils.system_info import umfpack_info

chroma_client = chromadb.Client()

chroma_client.reset()

collection_name = "my_collection" chroma_client.delete_collection(collection_name) collection = chroma_client.create_collection(name=collection_name)

student_info = """ Alexandra Thompson, a 19-year-old computer science sophomore with a 3.7 GPA, is a member of the programming and chess clubs who enjoys pizza, swimming, and hiking in her free time in hopes of working at a tech company after graduating from the University of Washington. """

club_info = """ The university chess club provides an outlet for students to come together and enjoy playing the classic strategy game of chess. Members of all skill levels are welcome, from beginners learning the rules to experienced tournament players. The club typically meets a few times per week to play casual games, participate in tournaments, analyze famous chess matches, and improve members' skills. """

university_info = """ The University of Washington, founded in 1861 in Seattle, is a public research university with over 45,000 students across three campuses in Seattle, Tacoma, and Bothell. As the flagship institution of the six public universities in Washington state, UW encompasses over 500 buildings and 20 million square feet of space, including one of the largest library systems in the world. """

collection.add( documents=[ student_info, club_info, university_info ], metadatas=[{"source": "student_info"}, {"source": "club_info"}, {"source": "university_info"}], ids=["id1", "id2", "id3"] )

results = collection.query( # query_texts=["How old is Alexandra Thompson?"], query_texts=["Where did Alexandra study?"], n_results=1 )

results

--- ChromaDB // from .txt

https://www.datacamp.com/tutorial/chromadb-tutorial-step-by-step-guide

import chromadb import os from langchain.text_splitter import RecursiveCharacterTextSplitter from langchain.embeddings import HuggingFaceEmbeddings

Initialize text splitter and embeddings

text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=100)

embeddings = HuggingFaceEmbeddings(model_name="BAAI/bge-large-en-v1.5")

chroma_client = chromadb.Client()

chroma_client.reset()

collection_name = "my_collection" chroma_client.delete_collection(collection_name) collection = chroma_client.create_collection(name=collection_name)

def read_text(file_path): with open(file_path, encoding="utf-8") as f: return f.read()

print(read_text('docs/example.txt'))

Process each TXT in the ./input directory

for filename in os.listdir('./docs'): if filename.endswith('.txt'): text = read_text(os.path.join('./docs', filename))

    # Split text into chunks
    chunks = text_splitter.split_text(text)

    # Convert chunks to vector representations and store in Chroma DB
    documents_list = []
    # embeddings_list = []
    ids_list = []

    for i, chunk in enumerate(chunks):
        # vector = embeddings.embed_query(chunk)

        documents_list.append(chunk)
        # embeddings_list.append(vector)
        ids_list.append(f"{filename}_{i}")


    collection.add(
        # embeddings=embeddings_list,
        documents=documents_list,
        ids=ids_list
    )

results = collection.query( # query_texts=["How old is Alexandra Thompson?"], # query_texts=["Where did Alexandra study?"], query_texts=["Was mag meine Katze?"], n_results=1 )

results['documents'][0][0]

reinforcement-learning-experiments / llm Goto Github PK

llm's Introduction

--- LLM

Example for Factual/Retrieval with less Hallucinations

--- Q/A:

Tutorial: Build Your First Question Answering System

Q&A Model:

model_name = "timpal0l/mdeberta-v3-base-squad2"

a) Get predictions

b) Load model & tokenizer

--- ChromaDB

from numpy.distutils.system_info import umfpack_info

chroma_client.reset()

--- ChromaDB // from .txt

Initialize text splitter and embeddings

embeddings = HuggingFaceEmbeddings(model_name="BAAI/bge-large-en-v1.5")

chroma_client.reset()

Process each TXT in the ./input directory

llm's People

Contributors

Watchers

Recommend Projects

Recommend Topics

Recommend Org