\n",
" \n",
- " | 32366 | \n",
- " vho70jcx | \n",
- " f056da9c64fbf00a4645ae326e8a4339d015d155 | \n",
- " biorxiv | \n",
- " SIANN: Strain Identification by Alignment to N... | \n",
- " 10.1101/001727 | \n",
- " NaN | \n",
- " NaN | \n",
- " biorxiv | \n",
- " Next-generation sequencing is increasingly bei... | \n",
- " 2014-01-10 | \n",
- " Samuel Minot; Stephen D Turner; Krista L Ternu... | \n",
- " NaN | \n",
- " NaN | \n",
- " NaN | \n",
- " True | \n",
- " False | \n",
- " biorxiv_medrxiv | \n",
- " https://doi.org/10.1101/001727 | \n",
+ " count | \n",
+ " 1934.000000 | \n",
+ " 1934.000000 | \n",
"
\n",
" \n",
- " | 32367 | \n",
- " i9tbix2v | \n",
- " daf32e013d325a6feb80e83d15aabc64a48fae33 | \n",
- " biorxiv | \n",
- " Spatial epidemiology of networked metapopulati... | \n",
- " 10.1101/003889 | \n",
- " NaN | \n",
- " NaN | \n",
- " biorxiv | \n",
- " An emerging disease is one infectious epidemic... | \n",
- " 2014-06-04 | \n",
- " Lin WANG; Xiang Li | \n",
- " NaN | \n",
- " NaN | \n",
- " NaN | \n",
- " True | \n",
- " False | \n",
- " biorxiv_medrxiv | \n",
- " https://doi.org/10.1101/003889 | \n",
+ " mean | \n",
+ " 222.068769 | \n",
+ " 2986.755429 | \n",
"
\n",
" \n",
- " | 32368 | \n",
- " 62gfisc6 | \n",
- " f33c6d94b0efaa198f8f3f20e644625fa3fe10d2 | \n",
- " biorxiv | \n",
- " Sequencing of the human IG light chain loci fr... | \n",
- " 10.1101/006866 | \n",
- " NaN | \n",
- " NaN | \n",
- " biorxiv | \n",
- " Germline variation at immunoglobulin gene (IG)... | \n",
- " 2014-07-03 | \n",
- " Corey T Watson; Karyn Meltz Steinberg; Tina A ... | \n",
- " NaN | \n",
- " NaN | \n",
- " NaN | \n",
- " True | \n",
- " False | \n",
- " biorxiv_medrxiv | \n",
- " https://doi.org/10.1101/006866 | \n",
+ " std | \n",
+ " 92.719230 | \n",
+ " 2207.443432 | \n",
"
\n",
" \n",
- " | 32369 | \n",
- " 058r9486 | \n",
- " 4da8a87e614373d56070ed272487451266dce919 | \n",
- " biorxiv | \n",
- " Bayesian mixture analysis for metagenomic comm... | \n",
- " 10.1101/007476 | \n",
- " NaN | \n",
- " NaN | \n",
- " biorxiv | \n",
- " Deep sequencing of clinical samples is now an ... | \n",
- " 2014-07-25 | \n",
- " Sofia Morfopoulou; Vincent Plagnol | \n",
- " NaN | \n",
- " NaN | \n",
- " NaN | \n",
- " True | \n",
- " False | \n",
- " biorxiv_medrxiv | \n",
- " https://doi.org/10.1101/007476 | \n",
+ " min | \n",
+ " 1.000000 | \n",
+ " 43.000000 | \n",
+ "
\n",
+ " \n",
+ " | 25% | \n",
+ " 152.000000 | \n",
+ " 1616.750000 | \n",
+ "
\n",
+ " \n",
+ " | 50% | \n",
+ " 216.000000 | \n",
+ " 2539.000000 | \n",
+ "
\n",
+ " \n",
+ " | 75% | \n",
+ " 270.000000 | \n",
+ " 3748.500000 | \n",
"
\n",
" \n",
- " | 32370 | \n",
- " wich35l7 | \n",
- " eccef80cfbe078235df22398f195d5db462d8000 | \n",
- " biorxiv | \n",
- " Mapping a viral phylogeny onto outbreak trees ... | \n",
- " 10.1101/010389 | \n",
- " NaN | \n",
- " NaN | \n",
- " biorxiv | \n",
- " Developing methods to reconstruct transmission... | \n",
- " 2014-11-11 | \n",
- " Stephen P Velsko; Jonathan E Allen | \n",
- " NaN | \n",
- " NaN | \n",
- " NaN | \n",
- " True | \n",
- " False | \n",
- " biorxiv_medrxiv | \n",
- " https://doi.org/10.1101/010389 | \n",
+ " max | \n",
+ " 678.000000 | \n",
+ " 44519.000000 | \n",
"
\n",
" \n",
"\n",
""
],
"text/plain": [
- " cord_uid sha source_x \\\n",
- "32366 vho70jcx f056da9c64fbf00a4645ae326e8a4339d015d155 biorxiv \n",
- "32367 i9tbix2v daf32e013d325a6feb80e83d15aabc64a48fae33 biorxiv \n",
- "32368 62gfisc6 f33c6d94b0efaa198f8f3f20e644625fa3fe10d2 biorxiv \n",
- "32369 058r9486 4da8a87e614373d56070ed272487451266dce919 biorxiv \n",
- "32370 wich35l7 eccef80cfbe078235df22398f195d5db462d8000 biorxiv \n",
- "\n",
- " title doi \\\n",
- "32366 SIANN: Strain Identification by Alignment to N... 10.1101/001727 \n",
- "32367 Spatial epidemiology of networked metapopulati... 10.1101/003889 \n",
- "32368 Sequencing of the human IG light chain loci fr... 10.1101/006866 \n",
- "32369 Bayesian mixture analysis for metagenomic comm... 10.1101/007476 \n",
- "32370 Mapping a viral phylogeny onto outbreak trees ... 10.1101/010389 \n",
- "\n",
- " pmcid pubmed_id license \\\n",
- "32366 NaN NaN biorxiv \n",
- "32367 NaN NaN biorxiv \n",
- "32368 NaN NaN biorxiv \n",
- "32369 NaN NaN biorxiv \n",
- "32370 NaN NaN biorxiv \n",
- "\n",
- " abstract publish_time \\\n",
- "32366 Next-generation sequencing is increasingly bei... 2014-01-10 \n",
- "32367 An emerging disease is one infectious epidemic... 2014-06-04 \n",
- "32368 Germline variation at immunoglobulin gene (IG)... 2014-07-03 \n",
- "32369 Deep sequencing of clinical samples is now an ... 2014-07-25 \n",
- "32370 Developing methods to reconstruct transmission... 2014-11-11 \n",
- "\n",
- " authors journal \\\n",
- "32366 Samuel Minot; Stephen D Turner; Krista L Ternu... NaN \n",
- "32367 Lin WANG; Xiang Li NaN \n",
- "32368 Corey T Watson; Karyn Meltz Steinberg; Tina A ... NaN \n",
- "32369 Sofia Morfopoulou; Vincent Plagnol NaN \n",
- "32370 Stephen P Velsko; Jonathan E Allen NaN \n",
- "\n",
- " Microsoft Academic Paper ID WHO #Covidence has_pdf_parse \\\n",
- "32366 NaN NaN True \n",
- "32367 NaN NaN True \n",
- "32368 NaN NaN True \n",
- "32369 NaN NaN True \n",
- "32370 NaN NaN True \n",
- "\n",
- " has_pmc_xml_parse full_text_file url \n",
- "32366 False biorxiv_medrxiv https://doi.org/10.1101/001727 \n",
- "32367 False biorxiv_medrxiv https://doi.org/10.1101/003889 \n",
- "32368 False biorxiv_medrxiv https://doi.org/10.1101/006866 \n",
- "32369 False biorxiv_medrxiv https://doi.org/10.1101/007476 \n",
- "32370 False biorxiv_medrxiv https://doi.org/10.1101/010389 "
+ " abstract_word_count body_word_count\n",
+ "count 1934.000000 1934.000000\n",
+ "mean 222.068769 2986.755429\n",
+ "std 92.719230 2207.443432\n",
+ "min 1.000000 43.000000\n",
+ "25% 152.000000 1616.750000\n",
+ "50% 216.000000 2539.000000\n",
+ "75% 270.000000 3748.500000\n",
+ "max 678.000000 44519.000000"
]
},
- "execution_count": 41,
+ "execution_count": 137,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
- "bio_clean.head()"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 42,
- "metadata": {},
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "['biorxiv'] [nan] [nan] [nan] [nan]\n"
- ]
- }
- ],
- "source": [
- "print(bio_clean['source_x'].unique(),\n",
- "bio_clean['pmcid'].unique(),\n",
- "bio_clean['pubmed_id'].unique(),\n",
- "bio_clean['Microsoft Academic Paper ID'].unique(),\n",
- "bio_clean['WHO #Covidence'].unique())"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 43,
- "metadata": {},
- "outputs": [],
- "source": [
- "bio_slim = bio_clean.drop(['Microsoft Academic Paper ID','WHO #Covidence','pubmed_id','pmcid'], axis = 1)"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 44,
- "metadata": {},
- "outputs": [],
- "source": [
- "bio_slim = bio_slim.drop(['url','doi','license','full_text_file'],axis =1 )"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 45,
- "metadata": {},
- "outputs": [],
- "source": [
- "bio_slim = bio_slim[~bio_slim.has_pdf_parse.isin(['False'])]"
+ "df_covid.describe()"
]
},
{
- "cell_type": "code",
- "execution_count": 46,
+ "cell_type": "markdown",
"metadata": {},
- "outputs": [],
"source": [
- "bio_slim =bio_slim.loc[~(bio_slim.abstract.isnull())]"
+    "We now clean the text data so that the keywords stand out and irrelevant details do not get in the way. [ref1](https://towardsdatascience.com/nlp-text-preprocessing-a-practical-guide-and-template-d80874676e79) [ref2](https://www.geeksforgeeks.org/text-preprocessing-in-python-set-1/)"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
- "As we had seen at the send of section 2.3, all_json contains the paths of all the json files(i.e. the articles) in it.\n",
- "Now we should load this into a dataframe for it to be queryable"
+    "First, looking at the abstract column, we notice that the text scraped from these articles is not perfect.\n",
+ "\n",
+ "For example, many of the abstracts start with the word *Abstract* glued to the beginning of the first word of the real abstract body. "
]
},
{
"cell_type": "code",
- "execution_count": 47,
+ "execution_count": 138,
"metadata": {},
"outputs": [
{
"data": {
+ "text/html": [
+ "\n",
" \n",
" | 0 | \n",
- " e6d882be4961d1bdd7507b4a29d86b650de0895d | \n",
- " Middle East Respiratory Syndrome coronavirus (... | \n",
- " Middle East respiratory syndrome coronavirus (... | \n",
- " Oh, Myoung-don. Park, Wan Beom... | \n",
- " (Middle East respiratory syndrome: what we lea... | \n",
- " 123 | \n",
- " 3907 | \n",
+ " 0015023cc06b5362d332b3baf348d11567ca2fbb | \n",
+ " the positive stranded rna genomes of picornavi... | \n",
+ " vp3, and vp0 (which is further processed to vp... | \n",
+ " Joseph C. Ward. Lidia Lasecka-Dykes... | \n",
+ " (The RNA pseudoknots in foot-and-mouth disease... | \n",
+ " 194 | \n",
+ " 1709 | \n",
"
\n",
" \n",
" | 1 | \n",
- " d0c4236f95ba2b3d5cdc71fde524b26262f05dd3 | \n",
- " In theoretical physics, there exist two basic ... | \n",
- " In theoretical physics, there exist two basic ... | \n",
- " Zhang, Ren. Zhang, Chun-Ting | \n",
- " (A Brief Review: The Z-curve Theory and its Ap... | \n",
- " 169 | \n",
- " 6359 | \n",
+ " 00340eea543336d54adda18236424de6a5e91c9d | \n",
+ " during the past three months, a new coronaviru... | \n",
+ " in december 2019, a novel coronavirus, sars-co... | \n",
+ " Carla Mavian. Simone Marini... | \n",
+ " (Regaining perspective on SARS-CoV-2 molecular... | \n",
+ " 138 | \n",
+ " 2487 | \n",
"
\n",
" \n",
" | 2 | \n",
- " d24afd9ee025b53015824be203db539009964fbd | \n",
- " BACKGROUND: The aim of this research was to ev... | \n",
- " In view of the role of thin-section CT scannin... | \n",
- " Xing, Zhi-Heng. Sun, Xin... | \n",
- " (Thin-section Computed Tomography Detects Long... | \n",
- " 326 | \n",
- " 2937 | \n",
+ " 004f0f8bb66cf446678dc13cf2701feec4f36d76 | \n",
+ " we integrate the human movement and healthcare... | \n",
+ " the 2019-ncov epidemic has spread across china... | \n",
+ " Hanchu Zhou. Jianan Yang... | \n",
+ " (Healthcare-resource-adjusted vulnerabilities ... | \n",
+ " 34 | \n",
+ " 749 | \n",
"
\n",
" \n",
" | 3 | \n",
- " 4a3941003ea2673397975ae8bc2536ad59f789e5 | \n",
- " INTRODUCTION: The Major Incident Hospital (MIH... | \n",
- " injury. Medical management does not simply inv... | \n",
- " Marres, G. M. H.. van der Eijk, J.... | \n",
- " (Evaluation of admissions to the Major Inciden... | \n",
- " 264 | \n",
- " 4830 | \n",
+ " 005d189d5bd7ac01aee65e934fd3d5186a3f7b27 | \n",
+ " the rapid outbreak of the new coronavirus (cov... | \n",
+ " the outbreak of infectious diseases has always... | \n",
+ " Behzad Pirouz. Amirsina Golmohammadi... | \n",
+ " (Relationship between Average Daily Temperatur... | \n",
+ " 249 | \n",
+ " 2791 | \n",
"
\n",
" \n",
" | 4 | \n",
- " 905e2b35719215760ebed8f3e93fdf6ea8ec9bcf | \n",
- " Mice infected with the neurotropic JHM strain ... | \n",
- " 1. Frequently change and/or sterilize gloves t... | \n",
- " Carbajal, Kevin S.. Weinger, Jason G.... | \n",
- " (Surgical Transplantation of Mouse Neural Stem... | \n",
- " 137 | \n",
- " 1300 | \n",
- "
\n",
- " \n",
- " | 5 | \n",
- " 319004f23d1af4357edb2a3862f2619be23a21a6 | \n",
- " Diagnostics play a central role in the early d... | \n",
- " ► The Middle East respiratory syndrome-coronav... | \n",
- " Kelly-Cirino, Cassandra. Mazzola, Laura T... | \n",
- " (An updated roadmap for MERS-CoV research and ... | \n",
- " 212 | \n",
- " 3632 | \n",
- "
\n",
- " \n",
- " | 6 | \n",
- " 4971940ab68e4950b28410a208166900e8ba9c07 | \n",
- " Despite of the role of domestic dogs as reserv... | \n",
- " Since its initial identification in the late 1... | \n",
- " Vieira, Flávia V.. Hoffmann, Daniel J.... | \n",
- " (Circulation of canine parvovirus among dogs l... | \n",
- " 137 | \n",
- " 1519 | \n",
- "
\n",
- " \n",
- " | 7 | \n",
- " cae1f2fd5785845caa42d6497361eba46a68f11d | \n",
- " Diversity and plasticity are two hallmarks of ... | \n",
- " Macrophages were first identified by Elie Metc... | \n",
- " Liu, Yan-Cun. Zou, Xian-Biao... | \n",
- " (Macrophage Polarization in Inflammatory Disea... | \n",
- " 111 | \n",
- " 4608 | \n",
- "
\n",
- " \n",
- " | 8 | \n",
- " 2ffddf5caaef38207b58710a93ee8361518813c9 | \n",
- " This commentary offers suggestions for improvi... | \n",
- " I n the early 20th century, the new field of m... | \n",
- " Kahn, Laura H. | \n",
- " (The need for one health degree programs, 40) | \n",
- " 56 | \n",
- " 1177 | \n",
- "
\n",
- " \n",
- " | 9 | \n",
- " 4bae83e2441c3738d96e49c21c9be0a4c85b4a92 | \n",
- " The protective efficacy of DNA plasmids encodi... | \n",
- " Avian infectious bronchitis (IB) is a major di... | \n",
- " Yan, Fang. Zhao, Yujun... | \n",
- " (Protection of chickens against infectious bro... | \n",
- " 179 | \n",
- " 2987 | \n",
+ " 00911cf4f99a3d5ae5e5b787675646a743574496 | \n",
+ " abstrarctthe fast accumulation of viral metage... | \n",
+ " metagenomic sequencing, which allows us to dir... | \n",
+ " Jiayu Shang. Yanni Sun | \n",
+ " (CHEER: hierarCHical taxonomic classification ... | \n",
+ " 139 | \n",
+ " 5153 | \n",
"
\n",
" \n",
"\n",
@@ -3960,254 +2637,394 @@
],
"text/plain": [
" paper_id \\\n",
- "0 e6d882be4961d1bdd7507b4a29d86b650de0895d \n",
- "1 d0c4236f95ba2b3d5cdc71fde524b26262f05dd3 \n",
- "2 d24afd9ee025b53015824be203db539009964fbd \n",
- "3 4a3941003ea2673397975ae8bc2536ad59f789e5 \n",
- "4 905e2b35719215760ebed8f3e93fdf6ea8ec9bcf \n",
- "5 319004f23d1af4357edb2a3862f2619be23a21a6 \n",
- "6 4971940ab68e4950b28410a208166900e8ba9c07 \n",
- "7 cae1f2fd5785845caa42d6497361eba46a68f11d \n",
- "8 2ffddf5caaef38207b58710a93ee8361518813c9 \n",
- "9 4bae83e2441c3738d96e49c21c9be0a4c85b4a92 \n",
+ "0 0015023cc06b5362d332b3baf348d11567ca2fbb \n",
+ "1 00340eea543336d54adda18236424de6a5e91c9d \n",
+ "2 004f0f8bb66cf446678dc13cf2701feec4f36d76 \n",
+ "3 005d189d5bd7ac01aee65e934fd3d5186a3f7b27 \n",
+ "4 00911cf4f99a3d5ae5e5b787675646a743574496 \n",
"\n",
" abstract \\\n",
- "0 Middle East Respiratory Syndrome coronavirus (... \n",
- "1 In theoretical physics, there exist two basic ... \n",
- "2 BACKGROUND: The aim of this research was to ev... \n",
- "3 INTRODUCTION: The Major Incident Hospital (MIH... \n",
- "4 Mice infected with the neurotropic JHM strain ... \n",
- "5 Diagnostics play a central role in the early d... \n",
- "6 Despite of the role of domestic dogs as reserv... \n",
- "7 Diversity and plasticity are two hallmarks of ... \n",
- "8 This commentary offers suggestions for improvi... \n",
- "9 The protective efficacy of DNA plasmids encodi... \n",
+ "0 the positive stranded rna genomes of picornavi... \n",
+ "1 during the past three months, a new coronaviru... \n",
+ "2 we integrate the human movement and healthcare... \n",
+ "3 the rapid outbreak of the new coronavirus (cov... \n",
+ "4 abstrarctthe fast accumulation of viral metage... \n",
"\n",
" body_text \\\n",
- "0 Middle East respiratory syndrome coronavirus (... \n",
- "1 In theoretical physics, there exist two basic ... \n",
- "2 In view of the role of thin-section CT scannin... \n",
- "3 injury. Medical management does not simply inv... \n",
- "4 1. Frequently change and/or sterilize gloves t... \n",
- "5 ► The Middle East respiratory syndrome-coronav... \n",
- "6 Since its initial identification in the late 1... \n",
- "7 Macrophages were first identified by Elie Metc... \n",
- "8 I n the early 20th century, the new field of m... \n",
- "9 Avian infectious bronchitis (IB) is a major di... \n",
+ "0 vp3, and vp0 (which is further processed to vp... \n",
+ "1 in december 2019, a novel coronavirus, sars-co... \n",
+ "2 the 2019-ncov epidemic has spread across china... \n",
+ "3 the outbreak of infectious diseases has always... \n",
+ "4 metagenomic sequencing, which allows us to dir... \n",
"\n",
- " authors \\\n",
- "0 Oh, Myoung-don. Park, Wan Beom... \n",
- "1 Zhang, Ren. Zhang, Chun-Ting \n",
- "2 Xing, Zhi-Heng. Sun, Xin... \n",
- "3 Marres, G. M. H.. van der Eijk, J.... \n",
- "4 Carbajal, Kevin S.. Weinger, Jason G.... \n",
- "5 Kelly-Cirino, Cassandra. Mazzola, Laura T... \n",
- "6 Vieira, Flávia V.. Hoffmann, Daniel J.... \n",
- "7 Liu, Yan-Cun. Zou, Xian-Biao... \n",
- "8 Kahn, Laura H. \n",
- "9 Yan, Fang. Zhao, Yujun... \n",
+ " authors \\\n",
+ "0 Joseph C. Ward. Lidia Lasecka-Dykes... \n",
+ "1 Carla Mavian. Simone Marini... \n",
+ "2 Hanchu Zhou. Jianan Yang... \n",
+ "3 Behzad Pirouz. Amirsina Golmohammadi... \n",
+ "4 Jiayu Shang. Yanni Sun \n",
"\n",
" title abstract_word_count \\\n",
- "0 (Middle East respiratory syndrome: what we lea... 123 \n",
- "1 (A Brief Review: The Z-curve Theory and its Ap... 169 \n",
- "2 (Thin-section Computed Tomography Detects Long... 326 \n",
- "3 (Evaluation of admissions to the Major Inciden... 264 \n",
- "4 (Surgical Transplantation of Mouse Neural Stem... 137 \n",
- "5 (An updated roadmap for MERS-CoV research and ... 212 \n",
- "6 (Circulation of canine parvovirus among dogs l... 137 \n",
- "7 (Macrophage Polarization in Inflammatory Disea... 111 \n",
- "8 (The need for one health degree programs, 40) 56 \n",
- "9 (Protection of chickens against infectious bro... 179 \n",
+ "0 (The RNA pseudoknots in foot-and-mouth disease... 194 \n",
+ "1 (Regaining perspective on SARS-CoV-2 molecular... 138 \n",
+ "2 (Healthcare-resource-adjusted vulnerabilities ... 34 \n",
+ "3 (Relationship between Average Daily Temperatur... 249 \n",
+ "4 (CHEER: hierarCHical taxonomic classification ... 139 \n",
"\n",
" body_word_count \n",
- "0 3907 \n",
- "1 6359 \n",
- "2 2937 \n",
- "3 4830 \n",
- "4 1300 \n",
- "5 3632 \n",
- "6 1519 \n",
- "7 4608 \n",
- "8 1177 \n",
- "9 2987 "
+ "0 1709 \n",
+ "1 2487 \n",
+ "2 749 \n",
+ "3 2791 \n",
+ "4 5153 "
]
},
- "execution_count": 51,
+ "execution_count": 141,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
- "df_covid['abstract_word_count'] = df_covid['abstract'].apply(lambda x: len(str(x).strip().split()))\n",
- "df_covid['body_word_count'] = df_covid['body_text'].apply(lambda x: len(str(x).strip().split()))\n",
- "df_covid.head(10)"
- ]
- },
- {
- "cell_type": "markdown",
- "metadata": {},
- "source": [
- "## Dataset statistics"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 74,
- "metadata": {},
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "Total number of words across all abstracts = 1383457. Average abstract length = 157.0147542844172\n"
- ]
- }
- ],
- "source": [
- "totalnumberofwords=df_covid['abstract_word_count'].sum()\n",
- "avg_abstract_len = totalnumberofwords/len(df_covid['abstract_word_count'])\n",
- "print(f'Total number of words across all abstracts = {totalnumberofwords}. Average abstract length = {avg_abstract_len}')"
+ "df_covid2['body_text'] = df_covid2['body_text'].apply(lambda x: str(x).lower())\n",
+ "df_covid2.head()"
]
},
{
"cell_type": "code",
- "execution_count": 52,
+ "execution_count": 142,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
- "