feat: add WikiData Component and depeciates the WikiData API tool component (#5872)
* update * [autofix.ci] apply automated fixes * Update test_wikidata_api.py * [autofix.ci] apply automated fixes * Update wikidata.py --------- Co-authored-by: autofix-ci[bot] <114827586+autofix-ci[bot]@users.noreply.github.com>
This commit is contained in:
parent
dcd68c5f4e
commit
229ba19a66
4 changed files with 252 additions and 136 deletions
|
|
@ -24,6 +24,7 @@ from .serp import SerpComponent
|
|||
from .serp_api import SerpAPIComponent
|
||||
from .tavily import TavilySearchComponent
|
||||
from .tavily_search import TavilySearchToolComponent
|
||||
from .wikidata import WikidataComponent
|
||||
from .wikidata_api import WikidataAPIComponent
|
||||
from .wikipedia import WikipediaComponent
|
||||
from .wikipedia_api import WikipediaAPIComponent
|
||||
|
|
@ -62,6 +63,7 @@ __all__ = [
|
|||
"TavilySearchComponent",
|
||||
"TavilySearchToolComponent",
|
||||
"WikidataAPIComponent",
|
||||
"WikidataComponent",
|
||||
"WikipediaAPIComponent",
|
||||
"WikipediaComponent",
|
||||
"WolframAlphaAPIComponent",
|
||||
|
|
|
|||
86
src/backend/base/langflow/components/tools/wikidata.py
Normal file
86
src/backend/base/langflow/components/tools/wikidata.py
Normal file
|
|
@ -0,0 +1,86 @@
|
|||
import httpx
|
||||
from httpx import HTTPError
|
||||
from langchain_core.tools import ToolException
|
||||
|
||||
from langflow.custom import Component
|
||||
from langflow.helpers.data import data_to_text
|
||||
from langflow.io import MultilineInput, Output
|
||||
from langflow.schema import Data
|
||||
from langflow.schema.message import Message
|
||||
|
||||
|
||||
class WikidataComponent(Component):
|
||||
display_name = "Wikidata"
|
||||
description = "Performs a search using the Wikidata API."
|
||||
icon = "Wikipedia"
|
||||
|
||||
inputs = [
|
||||
MultilineInput(
|
||||
name="query",
|
||||
display_name="Query",
|
||||
info="The text query for similarity search on Wikidata.",
|
||||
required=True,
|
||||
tool_mode=True,
|
||||
),
|
||||
]
|
||||
|
||||
outputs = [
|
||||
Output(display_name="Data", name="data", method="fetch_content"),
|
||||
Output(display_name="Message", name="text", method="fetch_content_text"),
|
||||
]
|
||||
|
||||
def fetch_content(self) -> list[Data]:
|
||||
try:
|
||||
# Define request parameters for Wikidata API
|
||||
params = {
|
||||
"action": "wbsearchentities",
|
||||
"format": "json",
|
||||
"search": self.query,
|
||||
"language": "en",
|
||||
}
|
||||
|
||||
# Send request to Wikidata API
|
||||
wikidata_api_url = "https://www.wikidata.org/w/api.php"
|
||||
response = httpx.get(wikidata_api_url, params=params)
|
||||
response.raise_for_status()
|
||||
response_json = response.json()
|
||||
|
||||
# Extract search results
|
||||
results = response_json.get("search", [])
|
||||
|
||||
if not results:
|
||||
return [Data(data={"error": "No search results found for the given query."})]
|
||||
|
||||
# Transform the API response into Data objects
|
||||
data = [
|
||||
Data(
|
||||
text=f"{result['label']}: {result.get('description', '')}",
|
||||
data={
|
||||
"label": result["label"],
|
||||
"id": result.get("id"),
|
||||
"url": result.get("url"),
|
||||
"description": result.get("description", ""),
|
||||
"concepturi": result.get("concepturi"),
|
||||
},
|
||||
)
|
||||
for result in results
|
||||
]
|
||||
|
||||
self.status = data
|
||||
except HTTPError as e:
|
||||
error_message = f"HTTP Error in Wikidata Search API: {e!s}"
|
||||
raise ToolException(error_message) from None
|
||||
except KeyError as e:
|
||||
error_message = f"Data parsing error in Wikidata API response: {e!s}"
|
||||
raise ToolException(error_message) from None
|
||||
except ValueError as e:
|
||||
error_message = f"Value error in Wikidata API: {e!s}"
|
||||
raise ToolException(error_message) from None
|
||||
else:
|
||||
return data
|
||||
|
||||
def fetch_content_text(self) -> Message:
|
||||
data = self.fetch_content()
|
||||
result_string = data_to_text("{text}", data)
|
||||
self.status = result_string
|
||||
return Message(text=result_string)
|
||||
|
|
@ -1,19 +1,63 @@
|
|||
from typing import Any
|
||||
|
||||
import httpx
|
||||
from httpx import HTTPError
|
||||
from langchain_core.tools import ToolException
|
||||
from langchain_core.tools import StructuredTool, ToolException
|
||||
from pydantic import BaseModel, Field
|
||||
|
||||
from langflow.custom import Component
|
||||
from langflow.helpers.data import data_to_text
|
||||
from langflow.io import MultilineInput, Output
|
||||
from langflow.base.langchain_utilities.model import LCToolComponent
|
||||
from langflow.field_typing import Tool
|
||||
from langflow.inputs import MultilineInput
|
||||
from langflow.schema import Data
|
||||
from langflow.schema.message import Message
|
||||
|
||||
|
||||
class WikidataAPIComponent(Component):
|
||||
display_name = "Wikidata API"
|
||||
class WikidataSearchSchema(BaseModel):
|
||||
query: str = Field(..., description="The search query for Wikidata")
|
||||
|
||||
|
||||
class WikidataAPIWrapper(BaseModel):
|
||||
"""Wrapper around Wikidata API."""
|
||||
|
||||
wikidata_api_url: str = "https://www.wikidata.org/w/api.php"
|
||||
|
||||
def results(self, query: str) -> list[dict[str, Any]]:
|
||||
# Define request parameters for Wikidata API
|
||||
params = {
|
||||
"action": "wbsearchentities",
|
||||
"format": "json",
|
||||
"search": query,
|
||||
"language": "en",
|
||||
}
|
||||
|
||||
# Send request to Wikidata API
|
||||
response = httpx.get(self.wikidata_api_url, params=params)
|
||||
response.raise_for_status()
|
||||
response_json = response.json()
|
||||
|
||||
# Extract and return search results
|
||||
return response_json.get("search", [])
|
||||
|
||||
def run(self, query: str) -> list[dict[str, Any]]:
|
||||
try:
|
||||
results = self.results(query)
|
||||
if results:
|
||||
return results
|
||||
|
||||
error_message = "No search results found for the given query."
|
||||
|
||||
raise ToolException(error_message)
|
||||
|
||||
except Exception as e:
|
||||
error_message = f"Error in Wikidata Search API: {e!s}"
|
||||
|
||||
raise ToolException(error_message) from e
|
||||
|
||||
|
||||
class WikidataAPIComponent(LCToolComponent):
|
||||
display_name = "Wikidata API [Deprecated]"
|
||||
description = "Performs a search using the Wikidata API."
|
||||
name = "WikidataAPI"
|
||||
icon = "Wikipedia"
|
||||
legacy = True
|
||||
|
||||
inputs = [
|
||||
MultilineInput(
|
||||
|
|
@ -21,67 +65,38 @@ class WikidataAPIComponent(Component):
|
|||
display_name="Query",
|
||||
info="The text query for similarity search on Wikidata.",
|
||||
required=True,
|
||||
tool_mode=True,
|
||||
),
|
||||
]
|
||||
|
||||
outputs = [
|
||||
Output(display_name="Data", name="data", method="fetch_content"),
|
||||
Output(display_name="Message", name="text", method="fetch_content_text"),
|
||||
]
|
||||
def build_tool(self) -> Tool:
|
||||
wrapper = WikidataAPIWrapper()
|
||||
|
||||
def fetch_content(self) -> list[Data]:
|
||||
try:
|
||||
# Define request parameters for Wikidata API
|
||||
params = {
|
||||
"action": "wbsearchentities",
|
||||
"format": "json",
|
||||
"search": self.query,
|
||||
"language": "en",
|
||||
}
|
||||
# Define the tool using StructuredTool and wrapper's run method
|
||||
tool = StructuredTool.from_function(
|
||||
name="wikidata_search_api",
|
||||
description="Perform similarity search on Wikidata API",
|
||||
func=wrapper.run,
|
||||
args_schema=WikidataSearchSchema,
|
||||
)
|
||||
|
||||
# Send request to Wikidata API
|
||||
wikidata_api_url = "https://www.wikidata.org/w/api.php"
|
||||
response = httpx.get(wikidata_api_url, params=params)
|
||||
response.raise_for_status()
|
||||
response_json = response.json()
|
||||
self.status = "Wikidata Search API Tool for Langchain"
|
||||
|
||||
# Extract search results
|
||||
results = response_json.get("search", [])
|
||||
return tool
|
||||
|
||||
if not results:
|
||||
return [Data(data={"error": "No search results found for the given query."})]
|
||||
def run_model(self) -> list[Data]:
|
||||
tool = self.build_tool()
|
||||
|
||||
# Transform the API response into Data objects
|
||||
data = [
|
||||
Data(
|
||||
text=f"{result['label']}: {result.get('description', '')}",
|
||||
data={
|
||||
"label": result["label"],
|
||||
"id": result.get("id"),
|
||||
"url": result.get("url"),
|
||||
"description": result.get("description", ""),
|
||||
"concepturi": result.get("concepturi"),
|
||||
},
|
||||
)
|
||||
for result in results
|
||||
]
|
||||
results = tool.run({"query": self.query})
|
||||
|
||||
self.status = data
|
||||
except HTTPError as e:
|
||||
error_message = f"HTTP Error in Wikidata Search API: {e!s}"
|
||||
raise ToolException(error_message) from None
|
||||
except KeyError as e:
|
||||
error_message = f"Data parsing error in Wikidata API response: {e!s}"
|
||||
raise ToolException(error_message) from None
|
||||
except ValueError as e:
|
||||
error_message = f"Value error in Wikidata API: {e!s}"
|
||||
raise ToolException(error_message) from None
|
||||
else:
|
||||
return data
|
||||
# Transform the API response into Data objects
|
||||
data = [
|
||||
Data(
|
||||
text=result["label"],
|
||||
metadata=result,
|
||||
)
|
||||
for result in results
|
||||
]
|
||||
|
||||
def fetch_content_text(self) -> Message:
|
||||
data = self.fetch_content()
|
||||
result_string = data_to_text("{text}", data)
|
||||
self.status = result_string
|
||||
return Message(text=result_string)
|
||||
self.status = data # type: ignore[assignment]
|
||||
|
||||
return data
|
||||
|
|
|
|||
|
|
@ -3,104 +3,117 @@ from unittest.mock import MagicMock, patch
|
|||
import httpx
|
||||
import pytest
|
||||
from langchain_core.tools import ToolException
|
||||
from langflow.components.tools import WikidataAPIComponent
|
||||
from langflow.components.tools import WikidataComponent
|
||||
from langflow.custom import Component
|
||||
from langflow.custom.utils import build_custom_component_template
|
||||
from langflow.schema import Data
|
||||
from langflow.schema.message import Message
|
||||
|
||||
|
||||
def test_wikidata_initialization():
|
||||
component = WikidataAPIComponent()
|
||||
assert component.display_name == "Wikidata API"
|
||||
assert component.description == "Performs a search using the Wikidata API."
|
||||
assert component.icon == "Wikipedia"
|
||||
# Import the base test class
|
||||
from tests.base import ComponentTestBaseWithoutClient
|
||||
|
||||
|
||||
def test_wikidata_template():
|
||||
wikidata = WikidataAPIComponent()
|
||||
component = Component(_code=wikidata._code)
|
||||
frontend_node, _ = build_custom_component_template(component)
|
||||
class TestWikidataComponent(ComponentTestBaseWithoutClient):
|
||||
@pytest.fixture
|
||||
def component_class(self):
|
||||
"""Fixture to create a WikidataComponent instance."""
|
||||
return WikidataComponent
|
||||
|
||||
# Verify basic structure
|
||||
assert isinstance(frontend_node, dict)
|
||||
@pytest.fixture
|
||||
def file_names_mapping(self):
|
||||
"""Return an empty list since this component doesn't have version-specific files."""
|
||||
return []
|
||||
|
||||
# Verify inputs
|
||||
assert "template" in frontend_node
|
||||
input_names = [input_["name"] for input_ in frontend_node["template"].values() if isinstance(input_, dict)]
|
||||
assert "query" in input_names
|
||||
@pytest.fixture
|
||||
def mock_query(self):
|
||||
"""Fixture to provide a default query."""
|
||||
return "test query"
|
||||
|
||||
def test_wikidata_initialization(self, component_class):
|
||||
component = component_class()
|
||||
assert component.display_name == "Wikidata"
|
||||
assert component.description == "Performs a search using the Wikidata API."
|
||||
assert component.icon == "Wikipedia"
|
||||
|
||||
@patch("langflow.components.tools.wikidata_api.httpx.get")
|
||||
def test_fetch_content_success(mock_httpx):
|
||||
component = WikidataAPIComponent()
|
||||
component.query = "test query"
|
||||
def test_wikidata_template(self, component_class):
|
||||
component = component_class()
|
||||
frontend_node, _ = build_custom_component_template(Component(_code=component._code))
|
||||
|
||||
# Mock successful API response
|
||||
mock_response = MagicMock()
|
||||
mock_response.json.return_value = {
|
||||
"search": [
|
||||
{
|
||||
"label": "Test Label",
|
||||
"id": "Q123",
|
||||
"url": "https://test.com",
|
||||
"description": "Test Description",
|
||||
"concepturi": "https://test.com/concept",
|
||||
}
|
||||
]
|
||||
}
|
||||
mock_httpx.return_value = mock_response
|
||||
# Verify basic structure
|
||||
assert isinstance(frontend_node, dict)
|
||||
|
||||
result = component.fetch_content()
|
||||
# Verify inputs
|
||||
assert "template" in frontend_node
|
||||
input_names = [input_["name"] for input_ in frontend_node["template"].values() if isinstance(input_, dict)]
|
||||
assert "query" in input_names
|
||||
|
||||
assert isinstance(result, list)
|
||||
assert len(result) == 1
|
||||
assert result[0].text == "Test Label: Test Description"
|
||||
assert result[0].data["label"] == "Test Label"
|
||||
assert result[0].data["id"] == "Q123"
|
||||
@patch("langflow.components.tools.wikidata_api.httpx.get")
|
||||
def test_fetch_content_success(self, mock_httpx, component_class, mock_query):
|
||||
component = component_class()
|
||||
component.query = mock_query
|
||||
|
||||
# Mock successful API response
|
||||
mock_response = MagicMock()
|
||||
mock_response.json.return_value = {
|
||||
"search": [
|
||||
{
|
||||
"label": "Test Label",
|
||||
"id": "Q123",
|
||||
"url": "https://test.com",
|
||||
"description": "Test Description",
|
||||
"concepturi": "https://test.com/concept",
|
||||
}
|
||||
]
|
||||
}
|
||||
mock_httpx.return_value = mock_response
|
||||
|
||||
@patch("langflow.components.tools.wikidata_api.httpx.get")
|
||||
def test_fetch_content_empty_response(mock_httpx):
|
||||
component = WikidataAPIComponent()
|
||||
component.query = "test query"
|
||||
result = component.fetch_content()
|
||||
|
||||
# Mock empty API response
|
||||
mock_response = MagicMock()
|
||||
mock_response.json.return_value = {"search": []}
|
||||
mock_httpx.return_value = mock_response
|
||||
assert isinstance(result, list)
|
||||
assert len(result) == 1
|
||||
assert result[0].text == "Test Label: Test Description"
|
||||
assert result[0].data["label"] == "Test Label"
|
||||
assert result[0].data["id"] == "Q123"
|
||||
|
||||
result = component.fetch_content()
|
||||
@patch("langflow.components.tools.wikidata_api.httpx.get")
|
||||
def test_fetch_content_empty_response(self, mock_httpx, component_class, mock_query):
|
||||
component = component_class()
|
||||
component.query = mock_query
|
||||
|
||||
assert isinstance(result, list)
|
||||
assert len(result) == 1
|
||||
assert "error" in result[0].data
|
||||
assert "No search results found" in result[0].data["error"]
|
||||
# Mock empty API response
|
||||
mock_response = MagicMock()
|
||||
mock_response.json.return_value = {"search": []}
|
||||
mock_httpx.return_value = mock_response
|
||||
|
||||
result = component.fetch_content()
|
||||
|
||||
@patch("langflow.components.tools.wikidata_api.httpx.get")
|
||||
def test_fetch_content_error_handling(mock_httpx):
|
||||
component = WikidataAPIComponent()
|
||||
component.query = "test query"
|
||||
assert isinstance(result, list)
|
||||
assert len(result) == 1
|
||||
assert "error" in result[0].data
|
||||
assert "No search results found" in result[0].data["error"]
|
||||
|
||||
# Mock HTTP error
|
||||
mock_httpx.side_effect = httpx.HTTPError("API Error")
|
||||
@patch("langflow.components.tools.wikidata_api.httpx.get")
|
||||
def test_fetch_content_error_handling(self, mock_httpx, component_class, mock_query):
|
||||
component = component_class()
|
||||
component.query = mock_query
|
||||
|
||||
with pytest.raises(ToolException):
|
||||
component.fetch_content()
|
||||
# Mock HTTP error
|
||||
mock_httpx.side_effect = httpx.HTTPError("API Error")
|
||||
|
||||
with pytest.raises(ToolException):
|
||||
component.fetch_content()
|
||||
|
||||
def test_fetch_content_text():
|
||||
component = WikidataAPIComponent()
|
||||
component.fetch_content = MagicMock(
|
||||
return_value=[
|
||||
Data(text="First result", data={"label": "Label 1"}),
|
||||
Data(text="Second result", data={"label": "Label 2"}),
|
||||
]
|
||||
)
|
||||
def test_fetch_content_text(self, component_class):
|
||||
component = component_class()
|
||||
component.fetch_content = MagicMock(
|
||||
return_value=[
|
||||
Data(text="First result", data={"label": "Label 1"}),
|
||||
Data(text="Second result", data={"label": "Label 2"}),
|
||||
]
|
||||
)
|
||||
|
||||
result = component.fetch_content_text()
|
||||
result = component.fetch_content_text()
|
||||
|
||||
assert isinstance(result, Message)
|
||||
assert "First result" in result.text
|
||||
assert "Second result" in result.text
|
||||
assert isinstance(result, Message)
|
||||
assert "First result" in result.text
|
||||
assert "Second result" in result.text
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue