Skip to content

Commit

Permalink
Remove unnecessary spaces from document object’s page_content of BiliBiliLoader (langchain-ai#4619)
Browse files Browse the repository at this point in the history

- Remove unnecessary spaces from the document object’s page_content in BiliBiliLoader
- Fix the BiliBiliLoader documentation and test file
  • Loading branch information
liaokongVFX authored May 16, 2023
1 parent f47ec5b commit f7e3d97
Show file tree
Hide file tree
Showing 3 changed files with 8 additions and 8 deletions.
4 changes: 2 additions & 2 deletions docs/modules/indexes/document_loaders/examples/bilibili.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@
"id": "66a7777e",
"metadata": {},
"source": [
"# Bilibili\n",
"# BiliBili\n",
"\n",
">[Bilibili](https://www.bilibili.tv/) is one of the most beloved long-form video sites in China.\n",
"\n",
Expand Down Expand Up @@ -35,7 +35,7 @@
},
"outputs": [],
"source": [
"from langchain.document_loaders.bilibili import BiliBiliLoader"
"from langchain.document_loaders import BiliBiliLoader"
]
},
{
Expand Down
10 changes: 5 additions & 5 deletions langchain/document_loaders/bilibili.py
Original file line number Diff line number Diff line change
Expand Up @@ -60,11 +60,11 @@ def _get_bilibili_subs_and_info(self, url: str) -> Tuple[str, dict]:
raw_sub_titles = json.loads(result.content)["body"]
raw_transcript = " ".join([c["content"] for c in raw_sub_titles])

raw_transcript_with_meta_info = f"""
Video Title: {video_info['title']},
description: {video_info['desc']}\n
Transcript: {raw_transcript}
"""
raw_transcript_with_meta_info = (
f"Video Title: {video_info['title']},"
f"description: {video_info['desc']}\n\n"
f"Transcript: {raw_transcript}"
)
return raw_transcript_with_meta_info, video_info
else:
raw_transcript = ""
Expand Down
2 changes: 1 addition & 1 deletion tests/integration_tests/document_loaders/test_bilibili.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
from langchain.document_loaders.bilibili import BiliBiliLoader
from langchain.document_loaders import BiliBiliLoader


def test_bilibili_loader() -> None:
Expand Down

0 comments on commit f7e3d97

Please sign in to comment.