forked from run-llama/llama-hub
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Loader for Macrometa GDN (run-llama#484)
Loader for Macrometa GDN
- Loading branch information
1 parent
43cf9c3
commit a207c69
Showing
6 changed files
with
119 additions
and
4 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,17 @@ | ||
# Macrometa GDN Loader | ||
|
||
This loader takes in a Macrometa federation URL, API key, and collection name and returns a list of vectors. | ||
|
||
## Usage | ||
|
||
To use this loader, you need to pass the URL and API key through the class contructor, and then load the data using an array of collection names. | ||
|
||
```python | ||
from llama_index import download_loader | ||
|
||
MacrometaGDNReader = download_loader('MacrometaGDNReader') | ||
|
||
collections = ['test_collection'] | ||
loader = MacrometaGDNReader(url="https://api-macrometa.io",apikey="test") | ||
vectors= loader.load_data(collection_list=collections) | ||
``` |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1 @@ | ||
"""Init file.""" |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,90 @@ | ||
"""Macrometa GDN Reader.""" | ||
|
||
from typing import List | ||
import requests | ||
import json | ||
|
||
from llama_index.readers.base import BaseReader | ||
from llama_index.readers.schema.base import Document | ||
|
||
|
||
class MacrometaGDNReader(BaseReader): | ||
"""Macrometa GDN Reader. | ||
Reads vectors from Macrometa GDN | ||
""" | ||
|
||
def __init__(self, url: str, apikey: str): | ||
self.url = url | ||
self.apikey = apikey | ||
|
||
def load_data(self, collection_list: List[str]) -> List[Document]: | ||
"""Loads data from the input directory. | ||
Args: | ||
api: Macrometa GDN API key | ||
collection_name: Name of the collection to read from | ||
""" | ||
if collection_list is None: | ||
raise ValueError("Must specify collection name(s)") | ||
|
||
results = [] | ||
for collection_name in collection_list: | ||
collection = self._load_collection(collection_name) | ||
results.append( | ||
Document( | ||
text=collection, extra_info={"collection_name": collection_name} | ||
) | ||
) | ||
return results | ||
|
||
def _load_collection(self, collection_name: str) -> str: | ||
all_documents = [] | ||
"""Loads a collection from the database. | ||
Args: | ||
collection_name: Name of the collection to read from | ||
""" | ||
url = self.url + "/_fabric/_system/_api/cursor" | ||
headers = { | ||
"accept": "application/json", | ||
"content-type": "application/json", | ||
"Authorization": "apikey " + self.apikey, | ||
} | ||
|
||
data = { | ||
"batchSize": 1000, | ||
"ttl": 60, | ||
"query": "FOR doc IN " + collection_name + " RETURN doc", | ||
} | ||
response = requests.post(url, headers=headers, data=json.dumps(data)) | ||
response_json = response.json() | ||
if response.status_code == 201: | ||
all_documents.extend(response_json.get("result", [])) | ||
|
||
while response_json.get("hasMore"): | ||
cursor_id = response_json.get("id") | ||
|
||
next_url = self.url + "/_fabric/_system/_api/cursor/" + cursor_id | ||
|
||
response = requests.put(next_url, headers=headers) | ||
|
||
if response.status_code == 200: | ||
response_json = response.json() | ||
all_documents.extend(response_json.get("result", [])) | ||
else: | ||
print(f"Request failed with status code {response.status_code}") | ||
break | ||
else: | ||
print(f"Initial request failed with status code {response.status_code}") | ||
|
||
return str(all_documents) | ||
|
||
|
||
if __name__ == "__main__": | ||
reader = MacrometaGDNReader("https://api-anurag.eng.macrometa.io", "test") | ||
print(reader.load_data(collection_list=["test"])) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,2 @@ | ||
requests | ||
json |