# %% [markdown]
# # zlu21: "codon usage bias" dataset records
#
# Stores one record per dataset URL in the `zlu21` collection of the
# `fdac19mp2` MongoDB database, then prints what each collection holds.
#
# Every write goes through `insert_if_missing`, so
# **Restart Kernel -> Run All** does not add duplicate records.

# %%
import pprint

import pymongo

# %% [markdown]
# ## Configuration

# %%
MONGO_HOST = "da1.eecs.utk.edu"
DB_NAME = "fdac19mp2"
TEMPLATE_COLLECTION = "audris"
MY_COLLECTION = "zlu21"

# Field values shared by all twenty records written to MY_COLLECTION.
TOPIC = 'codon usage bias'
LICENSE = 'NA'
DESCRIPTION = 'Variation_and_selection_on_codon_usage'
# NOTE(review): this label is identical to the one in TEMPLATE_RECORD below and
# is the same for every dataset; presumably a leftover placeholder. It is kept
# byte-for-byte so the stored records do not change. Confirm the intended
# per-dataset values before editing.
DATASET_LABEL = 'largest projects'

# One record is written per URL; position in this list (1-based) becomes the
# number in the record's 'dataset N' key.
DATASET_URLS = [
    'https://figshare.com/articles/Variation_and_selection_on_codon_usage_bias_across_an_entire_subphylum/9200030',
    'https://figshare.com/articles/The_Selective_Advantage_of_Synonymous_Codon_Usage_Bias_in_i_Salmonella_i_/3111637/1',
    'https://omictools.com/762796feea08897dacd8341ab94528b3-dataset',
    'https://datadryad.org/stash/dataset/doi:10.5061/dryad.qm44d',
    'https://datadryad.org/stash/dataset/doi:10.5061/dryad.7b470',
    'https://figshare.com/articles/Table_3_Compositional_Analysis_of_Flatworm_Genomes_Shows_Strong_Codon_Usage_Biases_Across_All_Classes_xlsx/9770996/1',
    'https://datadryad.org/stash/dataset/doi:10.5061/dryad.r0t1q',
    'https://datadryad.org/stash/dataset/doi:10.5061/dryad.3hc5t',
    'https://plos.figshare.com/articles/_Codon_usage_bias_indices_for_TP53_gene_across_mammalian_species_/1354190',
    'https://plos.figshare.com/articles/Comparative_Analysis_of_Codon_Usage_Bias_and_Codon_Context_Patterns_between_Dipteran_and_Hymenopteran_Sequenced_Genomes/121061/1',
    'https://datadryad.org/stash/dataset/doi:10.5061/dryad.4k887',
    'https://figshare.com/articles/Additional_file_2_of_Genome-wide_analysis_of_codon_usage_bias_in_Bovine_Coronavirus/5117068/1',
    'https://www.omicsdi.org/dataset/geo/GSE80130',
    'https://figshare.com/articles/_Genome_Wide_Analysis_of_Codon_Usage_and_Influencing_Factors_in_Chikungunya_Viruses_/951883',
    'https://plos.figshare.com/articles/Codon_usage_bias_reveals_genomic_adaptations_to_environmental_conditions_in_an_acidophilic_consortium/6240251',
    'https://www.researchgate.net/publication/305471626_Genome_wide_calculation_of_codon_usage_in_canine_distemper_virus_strains',
    'https://www.researchgate.net/publication/327133643_S3_Fig',
    'https://www.researchgate.net/publication/293833546_Additional_file_2',
    'https://www.datadryad.org/stash/dataset/doi:10.5061/dryad.9118',
    'https://journals.plos.org/plosone/article?id=10.1371/journal.pone.0194372#sec021',
]

# The record the first cell of this notebook writes to TEMPLATE_COLLECTION.
# Reproduced verbatim (including the 'starts' spelling) so that it still
# matches copies that are already stored.
TEMPLATE_RECORD = {
    'topic': 'git URLs',
    'first dataset': 'largest projects',
    'license': 'NA',
    'description': 'The list of projects on github with the largest number of starts',
    'urls': ['url1', 'url2'],
}

client = pymongo.MongoClient(host=MONGO_HOST)
db = client[DB_NAME]
pp = pprint.PrettyPrinter(indent=1, width=65)

# %% [markdown]
# ## Helpers

# %%
def insert_if_missing(coll, record):
    """Store ``record`` in ``coll`` unless an identical document is already there.

    Args:
        coll: the pymongo collection to write to.
        record: dict of field -> value; it is used both as the query and as
            the document to store.

    The record doubles as the filter, so a stored document that has all of
    these fields with equal values counts as "already there" and is replaced
    by the same content. When nothing matches, ``upsert=True`` makes the
    server insert the record. Re-running a cell therefore adds no new
    documents, unlike a plain ``insert_one``.
    """
    coll.replace_one(record, record, upsert=True)


def build_dataset_records(urls):
    """Return one record dict per URL, numbered from 1 in list order.

    Args:
        urls: sequence of dataset URL strings.

    Returns:
        A list of dicts with the keys 'topic', 'dataset N', 'license',
        'description' and 'urls' (a one-element list holding the URL).
        An empty ``urls`` gives an empty list.
    """
    return [
        {
            'topic': TOPIC,
            'dataset %d' % number: DATASET_LABEL,
            'license': LICENSE,
            'description': DESCRIPTION,
            'urls': [url],
        }
        for number, url in enumerate(urls, start=1)
    ]


def show_all(coll):
    """Pretty-print every document currently stored in ``coll``."""
    for stored in coll.find():
        print(pp.pformat(stored))

# %% [markdown]
# ## Template record in `audris`
#
# NOTE(review): this cell writes a placeholder record (`url1`, `url2`) into a
# collection other than this notebook's own; it looks like leftover template
# code. It is kept so the notebook still performs the same write on a fresh
# database. Confirm whether it should run at all.

# %%
insert_if_missing(db[TEMPLATE_COLLECTION], TEMPLATE_RECORD)

# %%
show_all(db[TEMPLATE_COLLECTION])

# %% [markdown]
# ## Dataset records in `zlu21`
#
# NOTE(review): records written by earlier runs are left untouched;
# `insert_if_missing` only avoids adding new copies, it does not clean up
# old ones.

# %%
for dataset_record in build_dataset_records(DATASET_URLS):
    insert_if_missing(db[MY_COLLECTION], dataset_record)

# %%
show_all(db[MY_COLLECTION])