An AI package for Elixir that focuses on higher level application concerns. It will include an AI UI component library for Phoenix.
In your mix.exs:
While in active Alpha development it is probably best to pull it from Github
def deps do
  [
    {:mulberry, github: "agoodway/mulberry", branch: "main"}
  ]
enddef deps do
  [
    {:mulberry, "~> 0.1.0"}
  ]
endMulberry now includes a flexible LangChain configuration system that supports multiple LLM providers with sensible defaults. The simplest configuration uses environment variables:
# Choose your provider (defaults to :openai)
export MULBERRY_LLM_PROVIDER=openai
# Set API keys for the providers you want to use
export OPENAI_API_KEY=your-openai-key
export ANTHROPIC_API_KEY=your-anthropic-key
# For Brave search functionality
export BRAVE_API_KEY=your-brave-keyYou can configure LangChain providers programmatically in your runtime.exs:
# Legacy configuration (still supported)
config :langchain, openai_key: System.get_env("OPENAI_API_KEY")
config :mulberry, brave_api_key: System.get_env("BRAVE_API_KEY")
# New configuration system (optional - defaults are provided)
config :mulberry, :langchain,
  default_provider: :openai,
  providers: [
    openai: [
      model: "gpt-4",
      temperature: 0.7
    ],
    anthropic: [
      model: "claude-3-opus-20240229",
      temperature: 0.5
    ]
  ]
# Enable verbose logging for debugging
config :mulberry, :verbose_logging, true- :openai- OpenAI's GPT models (default)
- :anthropic- Anthropic's Claude models
- :google- Google's Gemini models
- :mistral- Mistral AI models
- :ollama- Local Ollama models
- :vertex_ai- Google Vertex AI
- :bumblebee- Local Bumblebee models
Each provider supports configuration through environment variables:
- MULBERRY_LLM_PROVIDER- Default provider to use
- MULBERRY_[PROVIDER]_API_KEY- API key for specific provider
- MULBERRY_[PROVIDER]_MODEL- Default model for provider
- MULBERRY_[PROVIDER]_TEMPERATURE- Temperature setting
- MULBERRY_[PROVIDER]_MAX_TOKENS- Max tokens setting
- MULBERRY_[PROVIDER]_ENDPOINT- Custom endpoint URL
Examples:
export MULBERRY_OPENAI_MODEL=gpt-4
export MULBERRY_ANTHROPIC_MODEL=claude-3-opus-20240229
export MULBERRY_OLLAMA_ENDPOINT=http://localhost:11434/api/chat# Use default provider (OpenAI by default)
{:ok, summary} = Mulberry.Text.summarize("Long text to summarize...")
# Use Anthropic's Claude
{:ok, summary} = Mulberry.Text.summarize("Long text...", provider: :anthropic)
# Use Google's Gemini with custom temperature
{:ok, summary} = Mulberry.Text.summarize("Long text...", 
  provider: :google, 
  temperature: 0.2
)
# Generate title with Mistral AI
{:ok, title} = Mulberry.Text.title("Article content...", 
  provider: :mistral,
  model: "mistral-large"
)
# Use local Ollama installation
{:ok, summary} = Mulberry.Text.summarize("Long text...", 
  provider: :ollama,
  model: "llama2",
  endpoint: "http://localhost:11434/api/chat"
)import Flamel.Wrap, only: [ok: 1]
alias Mulberry.Document
alias Flamel.Result
defp handle_upload(socket, entry) do
  {:ok, text} =
    consume_uploaded_entry(socket, entry, fn %{path: path} ->
      %{path: path, mime: entry.client_type}
      |> Document.File.new()
      |> Document.load()
      |> Result.map(fn file -> file.contents end)
      |> ok()
    end)
  socket
  |> assign(:file, AsyncResult.loading())
  |> start_async(:file, fn -> Files.parse_text(text) end)
endThe above example uses Flamel to handle :ok and :error tuples. See Result.map/2 and ok/1
Generate a summary of a web pages from a Brave Search API query:
alias Mulberry.Search.Brave
alias Mulberry.Document
# this chain can be applied to any Mulberry.Document whether it is a web page or an image file
def load_and_generate_summary(chain) do
  chain
  |> Chain.apply(&Document.load/1)
  |> Chain.apply(&Document.generate_summary/1)
  |> Chain.to_tuple()
end
Mulberry.search(Brave, "what is the best cake recipe?")
# apply this sequence of operations to each document returned from the search query
|> Enum.map(Chain.curry(&load_and_generate_summary/1))
# remove any results that resulted in an error
|> Enum.filter(&Result.ok?/1)The above example uses Flamel chain a couple operations on the document and filter non-ok results. See Flamel.Chain and Result.ok?/1
Mulberry supports multiple retriever strategies for fetching web content:
# Use default retriever (Req)
{:ok, webpage} = Mulberry.Document.WebPage.new("https://example.com")
                 |> Mulberry.Document.load()
# Use Playwright for JavaScript-heavy sites
{:ok, webpage} = Mulberry.Document.WebPage.new("https://spa-app.com")
                 |> Mulberry.Document.load(retriever: Mulberry.Retriever.Playwright)
# Use ScrapingBee with API key
{:ok, webpage} = Mulberry.Document.WebPage.new("https://protected-site.com")
                 |> Mulberry.Document.load(
                   retriever: Mulberry.Retriever.ScrapingBee,
                   api_key: "your-scrapingbee-key"
                 )
# Try multiple retrievers in sequence
retrievers = [Mulberry.Retriever.Req, Mulberry.Retriever.Playwright]
{:ok, webpage} = Mulberry.Document.WebPage.new("https://example.com")
                 |> Mulberry.Document.load(retriever: retrievers)# Load a webpage and convert to Markdown
{:ok, webpage} = Mulberry.Document.WebPage.new("https://blog.example.com/article")
                 |> Mulberry.Document.load()
{:ok, markdown} = Mulberry.Document.to_text(webpage)
# Convert HTML to Markdown directly
html = "<h1>Title</h1><p>Some <strong>bold</strong> text</p>"
{:ok, markdown} = Mulberry.HTML.to_markdown(html)
# => "# Title\n\nSome **bold** text"
# Extract clean text from HTML
html_tree = Floki.parse_document!(html)
text = Mulberry.HTML.to_readable_text(html_tree)# Summarize with custom options and strategies
article = "Long article text..."
{:ok, summary} = Mulberry.Text.summarize(article,
  provider: :anthropic,
  model: "claude-3-haiku-20240307",
  strategy: :map_reduce,  # Use map-reduce for long texts
  chunk_size: 1000,
  max_tokens: 150,
  system_message: "Summarize in bullet points"
)
# Generate keywords
{:ok, keywords} = Mulberry.Text.keywords(article, 
  count: 10,
  provider: :openai
)
# Create a title with specific style
{:ok, title} = Mulberry.Text.title(article,
  system_message: "Create a catchy, SEO-friendly title under 60 characters"
)
# Generate title with examples to guide style
{:ok, title} = Mulberry.Text.title(article,
  examples: ["10 Ways to Boost Productivity", "The Ultimate Guide to Elixir"],
  max_words: 10
)
# Title generation with fallback
{:ok, title} = Mulberry.Text.title(article,
  fallback_title: "Technology Article",
  verbose: true
)
# Classify content
{:ok, category} = Mulberry.Text.classify(article,
  categories: ["Technology", "Business", "Health", "Sports"],
  provider: :google
)
# Enable verbose logging for debugging
{:ok, summary} = Mulberry.Text.summarize(article, verbose: true)Mulberry now uses an advanced chain-based summarization system internally, providing multiple strategies for handling documents of any size:
alias Mulberry.Document
alias Mulberry.Text
# Load a document
{:ok, doc} = Document.WebPage.new(%{url: "https://example.com"})
             |> Document.load()
# Basic summarization (uses stuff strategy by default)
{:ok, doc_with_summary} = Document.generate_summary(doc)
# Summarization with different strategies:
# Stuff Strategy - concatenates all chunks and summarizes in one call (default)
{:ok, summary} = Document.generate_summary(doc,
  strategy: :stuff,
  chunk_size: 1000
)
# Map-Reduce Strategy - summarizes chunks independently then combines
{:ok, summary} = Document.generate_summary(doc,
  strategy: :map_reduce,
  chunk_size: 500,
  on_progress: fn stage, info ->
    IO.puts("Progress: #{stage} - #{inspect(info)}")
  end
)
# Refine Strategy - iteratively refines summary with each chunk
{:ok, summary} = Document.generate_summary(doc,
  strategy: :refine,
  chunk_overlap: 100
)
# Direct text summarization with advanced options
text = "Long article text..."
{:ok, summary} = Text.summarize(text,
  strategy: :map_reduce,
  chunk_size: 1000,
  provider: :anthropic,
  temperature: 0.3
)
# Custom prompts for specific summarization styles
{:ok, bullet_summary} = Document.generate_summary(doc,
  system_message: "Summarize as a bulleted list of key points"
)
# Works with any document type (WebPage, File, etc.)
{:ok, pdf_doc} = Document.File.new(%{path: "report.pdf"})
                 |> Document.load()
                 
{:ok, pdf_summary} = Document.generate_summary(pdf_doc,
  strategy: :map_reduce,
  provider: :anthropic
)
# Progress tracking for long documents
{:ok, summary} = Text.summarize(long_text,
  strategy: :map_reduce,
  on_progress: fn stage, info ->
    case stage do
      :chunking -> IO.puts("Splitting into #{info.chunk_count} chunks")
      :map -> IO.puts("Processing chunk #{info.current}/#{info.total}")
      :reduce -> IO.puts("Combining summaries...")
      :complete -> IO.puts("Summarization complete!")
    end
  end
)Mulberry provides several Mix tasks for common operations. For a complete reference of all available Mix tasks and their options, see the Mix Tasks Guide.
# Fetch and display a webpage
mix fetch_url https://example.com
# Perform web searches
mix search "elixir programming"
# Generate text summaries
mix text summarize --file article.txt
# Conduct research on topics
mix research "machine learning trends" --max-sources 10# Process search results in parallel
alias Mulberry.{Search, Document, Text}
urls = [
  "https://example1.com",
  "https://example2.com", 
  "https://example3.com"
]
# Load all pages concurrently
tasks = Enum.map(urls, fn url ->
  Task.async(fn ->
    Document.WebPage.new(url)
    |> Document.load()
  end)
end)
webpages = Task.await_many(tasks, 30_000)
           |> Enum.filter(&match?({:ok, _}, &1))
           |> Enum.map(fn {:ok, page} -> page end)
# Generate summaries for all pages
summaries = webpages
            |> Enum.map(&Document.to_text/1)
            |> Enum.map(fn {:ok, text} -> 
              Task.async(fn -> Text.summarize(text) end)
            end)
            |> Task.await_many(30_000)# Create a custom LLM function
custom_llm = fn messages, _config ->
  # Your custom LLM implementation
  response = MyLLMService.chat(messages)
  {:ok, response}
end
# Use with Mulberry functions
{:ok, summary} = Mulberry.Text.summarize("Text to summarize",
  llm: custom_llm,
  system_message: "Custom instructions"
)
# Chain operations with custom LLM
import Flamel.Chain
webpage
|> Chain.apply(&Document.load/1)
|> Chain.apply(&Document.to_text/1)
|> Chain.apply(&Text.summarize(&1, llm: custom_llm))
|> Chain.to_tuple()# Extract text from various file types
alias Mulberry.Document
# PDF file
{:ok, pdf} = Document.File.new(%{path: "/path/to/document.pdf", mime: "application/pdf"})
             |> Document.load()
{:ok, text} = Document.to_text(pdf)
# Image with OCR
{:ok, image} = Document.File.new(%{path: "/path/to/scan.png", mime: "image/png"})
               |> Document.load()
{:ok, text} = Document.to_text(image)
# Process uploaded files in Phoenix
def handle_event("upload", _params, socket) do
  consume_uploaded_entries(socket, :document, fn %{path: path}, entry ->
    file = Document.File.new(%{path: path, mime: entry.client_type})
    
    with {:ok, doc} <- Document.load(file),
         {:ok, text} <- Document.to_text(doc),
         {:ok, summary} <- Text.summarize(text) do
      {:ok, %{filename: entry.client_name, summary: summary}}
    end
  end)
  |> case do
    [{:ok, result}] -> 
      {:noreply, assign(socket, :result, result)}
    _ -> 
      {:noreply, put_flash(socket, :error, "Failed to process file")}
  end
endMulberry uses a flexible DocumentTransformer behavior that allows you to add custom transformations to documents. Here's how to create and use your own transformations:
# 1. Create a custom transformer module
defmodule MyApp.DocumentTransformer.Sentiment do
  @moduledoc """
  Custom transformer that adds sentiment analysis to documents.
  """
  
  @behaviour Mulberry.DocumentTransformer
  
  alias Mulberry.Text
  
  @impl true
  def transform(document, transformation, opts \\ [])
  
  # Add a new :sentiment transformation
  def transform(document, :sentiment, opts) do
    # Extract text from the document
    text = get_document_text(document)
    
    # Perform sentiment analysis (using your preferred method)
    sentiment = analyze_sentiment(text, opts)
    
    # Add the sentiment to the document
    {:ok, Map.put(document, :sentiment, sentiment)}
  end
  
  # Add a new :entities transformation for named entity recognition
  def transform(document, :entities, opts) do
    text = get_document_text(document)
    
    # Extract entities using an LLM
    prompt = "Extract all named entities (people, places, organizations) from this text: #{text}"
    
    case Text.classify(text, 
      categories: ["person", "place", "organization", "other"],
      system_message: prompt,
      provider: Keyword.get(opts, :provider, :openai)
    ) do
      {:ok, entities} ->
        {:ok, Map.put(document, :entities, entities)}
      {:error, reason} ->
        {:error, reason, document}
    end
  end
  
  # Delegate standard transformations to the default transformer
  def transform(document, transformation, opts) when transformation in [:summary, :keywords, :title] do
    Mulberry.DocumentTransformer.Default.transform(document, transformation, opts)
  end
  
  # Handle unknown transformations
  def transform(document, transformation, _opts) do
    {:error, {:unsupported_transformation, transformation}, document}
  end
  
  # Helper to extract text from various document types
  defp get_document_text(document) do
    cond do
      Map.has_key?(document, :markdown) && is_binary(document.markdown) -> document.markdown
      Map.has_key?(document, :content) && is_binary(document.content) -> document.content
      Map.has_key?(document, :contents) && is_binary(document.contents) -> document.contents
      true -> ""
    end
  end
  
  defp analyze_sentiment(text, opts) do
    # Simple example - you could use an LLM or sentiment analysis library
    provider = Keyword.get(opts, :provider, :openai)
    
    case Text.classify(text, 
      categories: ["positive", "negative", "neutral"],
      provider: provider
    ) do
      {:ok, sentiment} -> sentiment
      {:error, _} -> "unknown"
    end
  end
end
# 2. Use your custom transformer with documents
alias Mulberry.Document
# Load a webpage
{:ok, webpage} = Document.WebPage.new(%{url: "https://news.example.com/article"})
                 |> Document.load()
# Use the custom transformer for sentiment analysis
{:ok, webpage_with_sentiment} = Document.transform(webpage, :sentiment, 
  transformer: MyApp.DocumentTransformer.Sentiment
)
IO.puts("Sentiment: #{webpage_with_sentiment.sentiment}")
# Use multiple transformations
{:ok, analyzed_page} = webpage
                       |> Document.transform(:sentiment, transformer: MyApp.DocumentTransformer.Sentiment)
                       |> elem(1)
                       |> Document.transform(:entities, transformer: MyApp.DocumentTransformer.Sentiment)
# 3. Create a specialized transformer for a specific document type
defmodule MyApp.DocumentTransformer.NewsArticle do
  @behaviour Mulberry.DocumentTransformer
  
  @impl true
  def transform(document, :metadata, opts) do
    # Extract article metadata like author, date, etc.
    text = get_document_text(document)
    
    prompt = """
    Extract the following from this news article:
    - Author
    - Publication date
    - Main topic
    - Key quotes
    
    Article: #{text}
    """
    
    # Use an LLM to extract structured data
    # ... implementation ...
    
    {:ok, Map.put(document, :metadata, extracted_metadata)}
  end
  
  # ... other transformations ...
end
# 4. Chain transformations together
import Flamel.Chain
result = webpage
         |> Chain.apply(&Document.load/1)
         |> Chain.apply(&Document.transform(&1, :summary))
         |> Chain.apply(&Document.transform(&1, :sentiment, transformer: MyApp.DocumentTransformer.Sentiment))
         |> Chain.apply(&Document.transform(&1, :entities, transformer: MyApp.DocumentTransformer.Sentiment))
         |> Chain.to_tuple()
case result do
  {:ok, final_doc} ->
    IO.inspect(final_doc.summary)
    IO.inspect(final_doc.sentiment)
    IO.inspect(final_doc.entities)
  {:error, reason} ->
    IO.puts("Processing failed: #{inspect(reason)}")
end
# 5. Set a default transformer for all operations
# In your config/runtime.exs:
config :mulberry, :default_transformer, MyApp.DocumentTransformer.Sentiment
# Now all documents will use your transformer by default
{:ok, doc_with_sentiment} = Document.transform(webpage, :sentiment)
# No need to specify transformer optionThe DocumentTransformer behavior provides a clean, extensible way to add new document processing capabilities while maintaining compatibility with existing transformations like :summary, :keywords, and :title.
## TODO
- [ ] Text to audio
- [ ] Audio to text
- [ ] Video to text
- [ ] Add embeddings to Text module
- [ ] Typesense Search Adapter
- [ ] Streaming audio and video support
- [ ] Agents
- [ ] Implement other file types
- [ ] Backfill tests
- [ ] and much much more...
Documentation can be generated with [ExDoc](https://github.com/elixir-lang/ex_doc)
and published on [HexDocs](https://hexdocs.pm). Once published, the docs can
be found at <https://hexdocs.pm/mulberry>.