https://dspy.ai/ | https://github.com/stanfordnlp/dspy | https://discord.gg/XCGy2WDCQB | https://www.youtube.com/watch?v=JEMYuzrKLUw - CS 194/294-196 (LLM Agents) - Lecture 5, Omar Khattab
import os
import dspy
lm = dspy.LM("openai/gpt-4o-mini", api_key=os.environ.get("OPENAI_API_KEY"))
dspy.configure(lm=lm)
lm("Say this is a test!", temperature=0.7)
lm(messages=[{"role": "user", "content": "Say this is a test!"}])
math = dspy.ChainOfThought("question -> answer: float")
math(question="Two dice are tossed. What is the probability that the sum equals two?")
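# A hedged usage sketch (not part of the original snippet): the call returns a dspy.Prediction
# whose fields follow the signature; dspy.ChainOfThought also adds a `reasoning` field.
pred = math(question="Two dice are tossed. What is the probability that the sum equals two?")
print(pred.reasoning)
print(pred.answer)  # a float, per the "question -> answer: float" signature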
def search_wikipedia(query: str) -> list[str]:
    results = dspy.ColBERTv2(url='http://20.102.90.50:2017/wiki17_abstracts')(query, k=3)
    return [x['text'] for x in results]
rag = dspy.ChainOfThought('context, question -> response')
question = "What's the name of the castle that David Gregory inherited?"
rag(context=search_wikipedia(question), question=question)
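# Hedged sketch: dspy.inspect_history shows the exact prompt and completion of the most
# recent LM call, which is useful for checking how the retrieved context was used.
dspy.inspect_history(n=1)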
from typing import Literal
class Classify(dspy.Signature):
    """Classify sentiment of a given sentence."""

    sentence: str = dspy.InputField()
    sentiment: Literal['positive', 'negative', 'neutral'] = dspy.OutputField()
    confidence: float = dspy.OutputField()
classify = dspy.Predict(Classify)
classify(sentence="This book was super fun to read, though not the last chapter.")
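# Hedged sketch: the prediction's fields are typed per the signature, so `sentiment` is one
# of the three literals and `confidence` is a float.
pred = classify(sentence="This book was super fun to read, though not the last chapter.")
print(pred.sentiment, pred.confidence)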
class ExtractInfo(dspy.Signature):
    """Extract structured information from text."""

    text: str = dspy.InputField()
    title: str = dspy.OutputField()
    headings: list[str] = dspy.OutputField()
    entities: list[dict[str, str]] = dspy.OutputField(desc="a list of entities and their metadata")
module = dspy.Predict(ExtractInfo)
text = "Apple Inc. announced its latest iPhone 14 today. " \
    "The CEO, Tim Cook, highlighted its new features in a press release."
response = module(text=text)
print(response.title)
print(response.headings)
print(response.entities)
def evaluate_math(expression: str):
    return dspy.PythonInterpreter({}).execute(expression)

def search_wikipedia(query: str):
    results = dspy.ColBERTv2(url='http://20.102.90.50:2017/wiki17_abstracts')(query, k=3)
    return [x['text'] for x in results]
react = dspy.ReAct("question -> answer: float", tools=[evaluate_math, search_wikipedia])
pred = react(question="What is 9362158 divided by the year of birth of David Gregory of Kinnairdy castle?")
print(pred.answer)
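# Hedged sketch: recent DSPy versions attach the agent's tool-call trajectory to the
# prediction; guard with getattr in case the field is absent in your version.
print(getattr(pred, "trajectory", None))
dspy.inspect_history(n=2)  # or inspect the last few LM calls directly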
class Outline(dspy.Signature):
    """Outline a thorough overview of a topic."""

    topic: str = dspy.InputField()
    title: str = dspy.OutputField()
    sections: list[str] = dspy.OutputField()
    section_subheadings: dict[str, list[str]] = dspy.OutputField(desc="mapping from section headings to subheadings")
class DraftSection(dspy.Signature):
    """Draft a top-level section of an article."""

    topic: str = dspy.InputField()
    section_heading: str = dspy.InputField()
    section_subheadings: list[str] = dspy.InputField()
    content: str = dspy.OutputField(desc="markdown-formatted section")
class DraftArticle(dspy.Module):
    def __init__(self):
        self.build_outline = dspy.ChainOfThought(Outline)
        self.draft_section = dspy.ChainOfThought(DraftSection)

    def forward(self, topic):
        outline = self.build_outline(topic=topic)
        sections = []
        for heading, subheadings in outline.section_subheadings.items():
            section, subheadings = f"## {heading}", [f"### {subheading}" for subheading in subheadings]
            section = self.draft_section(topic=outline.title, section_heading=section, section_subheadings=subheadings)
            sections.append(section.content)
        return dspy.Prediction(title=outline.title, sections=sections)
draft_article = DraftArticle()
article = draft_article(topic="World Cup 2002")
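# Hedged sketch: the returned dspy.Prediction exposes the fields set in forward().
print(article.title)
for section in article.sections:
    print(section[:100])  # preview the markdown of each drafted section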
import dspy
from dspy.datasets import HotPotQA
dspy.configure(lm=dspy.LM('openai/gpt-4o-mini'))
def search_wikipedia(query: str) -> list[str]:
    results = dspy.ColBERTv2(url='http://20.102.90.50:2017/wiki17_abstracts')(query, k=3)
    return [x['text'] for x in results]
trainset = [x.with_inputs('question') for x in HotPotQA(train_seed=2024, train_size=500).train]
react = dspy.ReAct("question -> answer", tools=[search_wikipedia])
tp = dspy.MIPROv2(metric=dspy.evaluate.answer_exact_match, auto="light", num_threads=24)
optimized_react = tp.compile(react, trainset=trainset)
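# Hedged sketch: optimized programs can be persisted and reloaded with dspy.Module's
# save/load; the filename here is illustrative.
optimized_react.save("optimized_react.json")
loaded_react = dspy.ReAct("question -> answer", tools=[search_wikipedia])
loaded_react.load("optimized_react.json")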
class RAG(dspy.Module):
    def __init__(self, num_docs=5):
        self.num_docs = num_docs
        self.respond = dspy.ChainOfThought('context, question -> response')

    def forward(self, question):
        context = search(question, k=self.num_docs)  # `search` is defined in the RAG tutorial at dspy.ai
        return self.respond(context=context, question=question)
tp = dspy.MIPROv2(metric=dspy.evaluate.SemanticF1(decompositional=True), auto="medium", num_threads=24)
optimized_rag = tp.compile(RAG(), trainset=trainset, max_bootstrapped_demos=2, max_labeled_demos=2)
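# Hedged sketch: score the optimized program with dspy.Evaluate, assuming a held-out
# `devset` of dspy.Example objects is available (not shown in the snippet above).
evaluate = dspy.Evaluate(devset=devset, metric=dspy.evaluate.SemanticF1(decompositional=True),
                         num_threads=24, display_progress=True)
evaluate(optimized_rag)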
import random
from typing import Literal
from dspy.datasets import DataLoader
from datasets import load_dataset
# Load the Banking77 dataset.
CLASSES = load_dataset("PolyAI/banking77", split="train", trust_remote_code=True).features['label'].names
kwargs = dict(fields=("text", "label"), input_keys=("text",), split="train", trust_remote_code=True)
# Load the first 2000 examples from the dataset, and assign a hint to each *training* example.
trainset = [
    dspy.Example(x, hint=CLASSES[x.label], label=CLASSES[x.label]).with_inputs("text", "hint")
    for x in DataLoader().from_huggingface(dataset_name="PolyAI/banking77", **kwargs)[:2000]
]
random.Random(0).shuffle(trainset)
import dspy
dspy.configure(lm=dspy.LM('openai/gpt-4o-mini-2024-07-18'))
# Define the DSPy module for classification. It will use the hint at training time, if available.
signature = dspy.Signature("text -> label").with_updated_fields('label', type_=Literal[tuple(CLASSES)])
classify = dspy.ChainOfThoughtWithHint(signature)
# Optimize via BootstrapFinetune.
optimizer = dspy.BootstrapFinetune(metric=(lambda x, y, trace=None: x.label == y.label), num_threads=24)
optimized_classifier = optimizer.compile(classify, trainset=trainset)
optimized_classifier(text="What does a pending cash withdrawal mean?")