| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465 |
- """RAG (检索增强生成) 模块
- 合并了 GraphRAG 能力:
- - loader:文件加载/分块(含PDF、语言标注、去重)
- - embedding/cache:嵌入与SQLite缓存,默认哈希回退
- - vector search:Qdrant召回
- - rank/merge:融合排序与片段合并
- """
- # 说明:原先的 .embeddings 已合并到上级目录的 memory/embedding.py
- # 这里做兼容导出,避免历史引用报错。
- from ..embedding import (
- EmbeddingModel,
- LocalTransformerEmbedding,
- TFIDFEmbedding,
- create_embedding_model,
- create_embedding_model_with_fallback,
- )
- from .document import Document, DocumentProcessor
- from .pipeline import (
- load_and_chunk_texts,
- build_graph_from_chunks,
- index_chunks,
- embed_query,
- search_vectors,
- rank,
- merge_snippets,
- rerank_with_cross_encoder,
- expand_neighbors_from_pool,
- compute_graph_signals_from_pool,
- merge_snippets_grouped,
- search_vectors_expanded,
- compress_ranked_items,
- tldr_summarize,
- )
- # 兼容旧类名(历史代码中可能从此处导入)
- SentenceTransformerEmbedding = LocalTransformerEmbedding
- HuggingFaceEmbedding = LocalTransformerEmbedding
- __all__ = [
- "EmbeddingModel",
- "LocalTransformerEmbedding",
- "SentenceTransformerEmbedding", # 兼容别名
- "HuggingFaceEmbedding", # 兼容别名
- "TFIDFEmbedding",
- "create_embedding_model",
- "create_embedding_model_with_fallback",
- "Document",
- "DocumentProcessor",
- "load_and_chunk_texts",
- "build_graph_from_chunks",
- "index_chunks",
- "embed_query",
- "search_vectors",
- "rank",
- "merge_snippets",
- "rerank_with_cross_encoder",
- "expand_neighbors_from_pool",
- "compute_graph_signals_from_pool",
- "merge_snippets_grouped",
- "search_vectors_expanded",
- "compress_ranked_items",
- "tldr_summarize",
- ]
|