From a4e209ac2b1f40a21fbe3619d4fbc598f05517f3 Mon Sep 17 00:00:00 2001 From: Adrian Liechti Date: Sun, 22 Sep 2024 23:37:39 +0200 Subject: [PATCH] use text for jina extractor --- pkg/extractor/jina/client.go | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pkg/extractor/jina/client.go b/pkg/extractor/jina/client.go index 037cff6a..0d00ff7b 100644 --- a/pkg/extractor/jina/client.go +++ b/pkg/extractor/jina/client.go @@ -53,7 +53,7 @@ func (c *Client) Extract(ctx context.Context, input extractor.File, options *ext req, _ := http.NewRequestWithContext(ctx, "POST", c.url, jsonReader(body)) req.Header.Set("Content-Type", "application/json") - req.Header.Set("X-Return-Format", "markdown") + req.Header.Set("X-Return-Format", "text") if c.token != "" { req.Header.Set("Authorization", "Bearer "+c.token)