RAGFlow go API server (#13240)

# RAGFlow Go Implementation Plan 🚀

This repository tracks the progress of porting RAGFlow to Go. We'll
implement core features and provide performance comparisons between
Python and Go versions.

## Implementation Checklist

- [x] User Management APIs
- [x] Dataset Management Operations
- [x] Retrieval Test
- [x] Chat Management Operations
- [x] Infinity Go SDK

---------

Signed-off-by: Jin Hai <haijin.chn@gmail.com>
Co-authored-by: Yingfeng Zhang <yingfeng.zhang@gmail.com>
This commit is contained in:
Jin Hai
2026-03-04 19:17:16 +08:00
committed by GitHub
parent 2508c46c8f
commit 70e9743ef1
257 changed files with 80490 additions and 6 deletions

View File

@ -0,0 +1,225 @@
// C API implementation for RAGAnalyzer
#include "rag_analyzer_c_api.h"
#include "rag_analyzer.h"
#include "term.h"
#include <cstring>
#include <string>
#include <vector>
extern "C" {
RAGAnalyzerHandle RAGAnalyzer_Create(const char* path) {
if (!path) return nullptr;
try {
RAGAnalyzer* analyzer = new RAGAnalyzer(std::string(path));
return static_cast<RAGAnalyzerHandle>(analyzer);
} catch (...) {
return nullptr;
}
}
void RAGAnalyzer_Destroy(RAGAnalyzerHandle handle) {
if (handle) {
RAGAnalyzer* analyzer = static_cast<RAGAnalyzer*>(handle);
delete analyzer;
}
}
int RAGAnalyzer_Load(RAGAnalyzerHandle handle) {
if (!handle) return -1;
RAGAnalyzer* analyzer = static_cast<RAGAnalyzer*>(handle);
return analyzer->Load();
}
void RAGAnalyzer_SetFineGrained(RAGAnalyzerHandle handle, bool fine_grained) {
if (!handle) return;
RAGAnalyzer* analyzer = static_cast<RAGAnalyzer*>(handle);
analyzer->SetFineGrained(fine_grained);
}
void RAGAnalyzer_SetEnablePosition(RAGAnalyzerHandle handle, bool enable_position) {
if (!handle) return;
RAGAnalyzer* analyzer = static_cast<RAGAnalyzer*>(handle);
analyzer->SetEnablePosition(enable_position);
}
int RAGAnalyzer_Analyze(RAGAnalyzerHandle handle, const char* text, RAGTokenCallback callback) {
if (!handle || !text || !callback) return -1;
RAGAnalyzer* analyzer = static_cast<RAGAnalyzer*>(handle);
Term input;
input.text_ = std::string(text);
TermList output;
// Use the analyzer's internal state for fine_grained and enable_position
int ret = analyzer->Analyze(input, output, analyzer->fine_grained_, analyzer->enable_position_);
if (ret != 0) {
return ret;
}
// Call callback for each token
for (const auto& term : output) {
callback(term.text_.c_str(), term.text_.length(), term.word_offset_, term.end_offset_);
}
return 0;
}
char* RAGAnalyzer_Tokenize(RAGAnalyzerHandle handle, const char* text) {
if (!handle || !text) return nullptr;
RAGAnalyzer* analyzer = static_cast<RAGAnalyzer*>(handle);
std::string result = analyzer->Tokenize(std::string(text));
// Allocate memory for C string
char* c_result = static_cast<char*>(malloc(result.size() + 1));
if (c_result) {
std::memcpy(c_result, result.c_str(), result.size() + 1);
}
return c_result;
}
RAGTokenList* RAGAnalyzer_TokenizeWithPosition(RAGAnalyzerHandle handle, const char* text) {
if (!handle || !text) return nullptr;
RAGAnalyzer* analyzer = static_cast<RAGAnalyzer*>(handle);
Term input;
input.text_ = std::string(text);
TermList output;
// Pass fine_grained and enable_position=true to get position information
analyzer->Analyze(input, output, analyzer->fine_grained_, true);
// Allocate memory for the token list structure
RAGTokenList* token_list = static_cast<RAGTokenList*>(malloc(sizeof(RAGTokenList)));
if (!token_list) {
return nullptr;
}
// Allocate memory for the tokens array
token_list->tokens = static_cast<RAGTokenWithPosition*>(
malloc(sizeof(RAGTokenWithPosition) * output.size())
);
if (!token_list->tokens) {
free(token_list);
return nullptr;
}
token_list->count = static_cast<uint32_t>(output.size());
// Fill in the tokens
for (size_t i = 0; i < output.size(); ++i) {
// Allocate memory for the text and copy it
token_list->tokens[i].text = static_cast<char*>(
malloc(output[i].text_.size() + 1)
);
if (token_list->tokens[i].text) {
std::memcpy(token_list->tokens[i].text,
output[i].text_.c_str(),
output[i].text_.size() + 1);
}
token_list->tokens[i].offset = output[i].word_offset_;
token_list->tokens[i].end_offset = output[i].end_offset_;
}
return token_list;
}
void RAGAnalyzer_FreeTokenList(RAGTokenList* token_list) {
if (!token_list) return;
if (token_list->tokens) {
for (uint32_t i = 0; i < token_list->count; ++i) {
if (token_list->tokens[i].text) {
free(token_list->tokens[i].text);
}
}
free(token_list->tokens);
}
free(token_list);
}
// Helper functions to access token fields
const char* RAGToken_GetText(void* token) {
if (!token) return nullptr;
RAGTokenWithPosition* t = static_cast<RAGTokenWithPosition*>(token);
return t->text;
}
uint32_t RAGToken_GetOffset(void* token) {
if (!token) return 0;
RAGTokenWithPosition* t = static_cast<RAGTokenWithPosition*>(token);
return t->offset;
}
uint32_t RAGToken_GetEndOffset(void* token) {
if (!token) return 0;
RAGTokenWithPosition* t = static_cast<RAGTokenWithPosition*>(token);
return t->end_offset;
}
char* RAGAnalyzer_FineGrainedTokenize(RAGAnalyzerHandle handle, const char* tokens) {
if (!handle || !tokens) return nullptr;
RAGAnalyzer* analyzer = static_cast<RAGAnalyzer*>(handle);
std::vector<std::string> result;
analyzer->FineGrainedTokenize(std::string(tokens), result);
// Join results with space
std::string result_str;
for (size_t i = 0; i < result.size(); ++i) {
if (i > 0) result_str += " ";
result_str += result[i];
}
// Allocate memory for C string
char* c_result = static_cast<char*>(malloc(result_str.size() + 1));
if (c_result) {
std::memcpy(c_result, result_str.c_str(), result_str.size() + 1);
}
return c_result;
}
int32_t RAGAnalyzer_GetTermFreq(RAGAnalyzerHandle handle, const char* term) {
if (!handle || !term) return 0;
RAGAnalyzer* analyzer = static_cast<RAGAnalyzer*>(handle);
return analyzer->Freq(term);
}
char* RAGAnalyzer_GetTermTag(RAGAnalyzerHandle handle, const char* term) {
if (!handle || !term) return nullptr;
RAGAnalyzer* analyzer = static_cast<RAGAnalyzer*>(handle);
std::string tag_result = analyzer->Tag(term);
if (tag_result.empty()) {
return nullptr;
}
// Allocate memory for C string
char* c_result = static_cast<char*>(malloc(tag_result.size() + 1));
if (c_result) {
std::memcpy(c_result, tag_result.c_str(), tag_result.size() + 1);
}
return c_result;
}
RAGAnalyzerHandle RAGAnalyzer_Copy(RAGAnalyzerHandle handle) {
if (!handle) return nullptr;
try {
RAGAnalyzer* original = static_cast<RAGAnalyzer*>(handle);
RAGAnalyzer* copy = new RAGAnalyzer(*original);
return static_cast<RAGAnalyzerHandle>(copy);
} catch (...) {
return nullptr;
}
}
} // extern "C"