llm-bucket 0.2.0

Open source core logic and pipelines for synchronising a bucket with content for LLMs to consume with RAG.
Documentation
# config.yaml.example
# Example configuration for llm-bucket sync CLI
# Copy this file to `config.yaml`, fill in your real values, and keep the real config.yaml out of git!
#
# NOTE: Never commit secrets or production values.

download:
  output_dir: ./tmp/exports                  # Directory where source(s) will be checked out & processed
  sources:
    - type: git
      repo_url: "git@github.com:kasbuunk/llm-bucket.git" # Replace with your repo URL
      reference: main                        # (optional) branch, tag, or commit. Use "main" if unsure.

    - type: confluence
      base_url: "https://yourcompany.atlassian.net/wiki" # Replace with your Confluence base URL
      space_key: "MKTG"                                 # Replace with your target space key

process:
  kind: FlattenFiles                         # "FlattenFiles" or "ReadmeToPDF" (see README for other modes)

# To use:
#   cp config.yaml.example config.yaml
#   Edit config.yaml as needed.
#   Add "config.yaml" to your .gitignore!