Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
306 changes: 306 additions & 0 deletions .ipynb_checkpoints/zyang37-checkpoint.ipynb
Original file line number Diff line number Diff line change
@@ -0,0 +1,306 @@
{
"cells": [
{
"cell_type": "code",
"execution_count": 57,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:15: DeprecationWarning: insert is deprecated. Use insert_one or insert_many instead.\n",
" from ipykernel import kernelapp as app\n"
]
},
{
"data": {
"text/plain": [
"ObjectId('5d84f3262d00ba2e15691013')"
]
},
"execution_count": 57,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# simply ran it 20 times with different databases' information\n",
"\n",
"import pprint\n",
"import re\n",
"import pymongo, json\n",
"\n",
"pp = pprint.PrettyPrinter(indent=1,width=65)\n",
"\n",
"client = pymongo.MongoClient (host=\"da1.eecs.utk.edu\")\n",
"db = client ['fdac19mp2']\n",
"coll = db ['zyang37']\n",
"# for each dataset\n",
"coll.insert ( { 'topic':'Mat-Su Borough Land Sales', \n",
" 'title': 'Mat-Su Borough Land Sales', \n",
" 'license': 'Matanuska Susitna Borough Land Sale and Tax & LID Foreclosure Sale Viewer', \n",
" 'description': 'The Mat-Su Borough Land Sale Application has been developed as an interactive tool for previewing and researching properties available through the borough’s different land sale programs. ', \n",
" 'urls': ['https://data1-msb.opendata.arcgis.com/items/08d489a99ebe447eb87e99f018c96100'] } )\n"
]
},
{
"cell_type": "code",
"execution_count": 58,
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/usr/local/lib/python3.6/dist-packages/ipykernel_launcher.py:1: DeprecationWarning: count is deprecated. Use estimated_document_count or count_documents instead. Please note that $where must be replaced by $expr, $near must be replaced by $geoWithin with $center, and $nearSphere must be replaced by $geoWithin with $centerSphere\n",
" \"\"\"Entry point for launching an IPython kernel.\n"
]
},
{
"data": {
"text/plain": [
"20"
]
},
"execution_count": 58,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"coll.count()"
]
},
{
"cell_type": "code",
"execution_count": 59,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"{'_id': ObjectId('5d84eb402d00ba2e15690fdb'),\n",
" 'description': 'The labelled data set consists of 25,000 IMDB '\n",
" 'movie reviews, specially selected for '\n",
" 'sentiment analysis.',\n",
" 'license': 'Unknown',\n",
" 'title': 'MovieReviewTrainingDatabase.csv ',\n",
" 'topic': 'IMBD Movie Reviews For Binary Sentiment Analysis',\n",
" 'urls': ['https://www.kaggle.com/mwallerphunware/imbd-movie-reviews-for-binary-sentiment-analysis']}\n",
"{'_id': ObjectId('5d84ecb52d00ba2e15690fde'),\n",
" 'description': 'Netflix held the Netflix Prize open '\n",
" 'competition for the best algorithm to predict '\n",
" 'user ratings for films. The grand prize was '\n",
" \"$1,000,000 and was won by BellKor's Pragmatic \"\n",
" 'Chaos team. This is the dataset that was used '\n",
" 'in that competition.',\n",
" 'license': 'Unknown',\n",
" 'title': 'Netflix Prize data',\n",
" 'topic': 'Netflix Prize data',\n",
" 'urls': [' https://archive.org/download/nf_prize_dataset.tar']}\n",
"{'_id': ObjectId('5d84ed892d00ba2e15690fe0'),\n",
" 'description': 'This table contains 25 series, with data for '\n",
" 'years 1956 - present (not all combinations '\n",
" 'necessarily have data for all years).',\n",
" 'license': 'Rights under which the catalog can be reused are '\n",
" 'outlined in the Open Government Licence - Canada',\n",
" 'title': 'Toronto Stock Exchange statistics',\n",
" 'topic': 'Toronto Stock Exchange statistics',\n",
" 'urls': ['https://data.wu.ac.at/schema/www_data_gc_ca/MGUxZTU3YWEtZTY2NC00MWI1LWE2OWYtZDgxNGQ0NDA3ZDYy']}\n",
"{'_id': ObjectId('5d84edf92d00ba2e15690fe3'),\n",
" 'description': 'The statistic presents the total trading value '\n",
" 'of stocks on the first section of the Tokyo '\n",
" 'Stock Exchange (TSE) in Japan from 2008 to '\n",
" '2017',\n",
" 'license': 'Unknown',\n",
" 'title': 'TSE stocks trading value 2008-2017',\n",
" 'topic': 'Statista',\n",
" 'urls': ['https://www.statista.com/statistics/633276/japan-tokyo-stock-exchange-total-trading-value/']}\n",
"{'_id': ObjectId('5d84eec92d00ba2e15690fe6'),\n",
" 'description': 'Graph and download economic data for New One '\n",
" 'Family Homes for Sale in the United States '\n",
" '(HNFSEPUSSA) from Jan 1963 to Jul 2019 about '\n",
" '1-unit structures, family, new, sales, '\n",
" 'housing, and USA.',\n",
" 'license': 'https://research.stlouisfed.org/fred_terms.html',\n",
" 'title': 'New One Family Homes for Sale in the United States',\n",
" 'topic': 'New One Family Homes for Sale in the United States',\n",
" 'urls': ['https://fred.stlouisfed.org/series/HNFSEPUSSA']}\n",
"{'_id': ObjectId('5d84ef292d00ba2e15690fe9'),\n",
" 'description': 'Other Metrics',\n",
" 'license': 'Other',\n",
" 'title': 'For-Sale Inventory (Smooth, SA)',\n",
" 'topic': 'For-Sale Inventory Smooth',\n",
" 'urls': ['https://data.world/zillow-data/for-sale-inventory-smooth']}\n",
"{'_id': ObjectId('5d84ef6b2d00ba2e15690fec'),\n",
" 'description': 'Graph and download economic data for New '\n",
" 'Houses for Sale by Stage of Construction, '\n",
" 'Completed (NHFSEPC) from Jan 1973 to Jul 2019 '\n",
" 'about construction, new, sales, housing, and '\n",
" 'USA.',\n",
" 'license': 'https://research.stlouisfed.org/fred_terms.html',\n",
" 'title': 'New Houses for Sale by Stage of Construction, '\n",
" 'Completed',\n",
" 'topic': 'New Houses for Sale by Stage of Construction, '\n",
" 'Completed',\n",
" 'urls': ['https://fred.stlouisfed.org/series/NHFSEPC']}\n",
"{'_id': ObjectId('5d84efe12d00ba2e15690fef'),\n",
" 'description': 'This dataset was collected by me from car sale '\n",
" 'advertisements for study/practice purposes in '\n",
" '2016.',\n",
" 'license': 'CC0: Public Domain',\n",
" 'title': 'Car Sale Advertisements',\n",
" 'topic': 'Car Sale Advertisements',\n",
" 'urls': ['https://www.kaggle.com/antfarol/car-sale-advertisements']}\n",
"{'_id': ObjectId('5d84f02c2d00ba2e15690ff2'),\n",
" 'description': 'This dataset contains house sale prices for '\n",
" 'King County, which includes Seattle. It '\n",
" 'includes homes sold between May 2014 and May '\n",
" '2015.',\n",
" 'license': 'CC0: Public Domain',\n",
" 'title': 'House Sales in King County, USA',\n",
" 'topic': 'House Sales in King County, USA',\n",
" 'urls': ['https://www.kaggle.com/harlfoxem/housesalesprediction']}\n",
"{'_id': ObjectId('5d84f07e2d00ba2e15690ff5'),\n",
" 'description': 'This dataset contains data on all Real '\n",
" 'Property parcels that have sold since 2013 in '\n",
" 'Allegheny County, PA.',\n",
" 'license': 'http://www.opendefinition.org/licenses/cc-zero',\n",
" 'title': 'Allegheny County Property Sale Transactions',\n",
" 'topic': 'Allegheny County Property Sale Transactions',\n",
" 'urls': ['https://data.wu.ac.at/schema/data_gov/MzRmOWY4YWEtMmZjOC00YTM3LTk1MTgtNzI4NmZhNDNjZGI5']}\n",
"{'_id': ObjectId('5d84f0dd2d00ba2e15690ff8'),\n",
" 'description': 'Under Illinois law, the Treasurer’s Office is '\n",
" 'required to hold an Annual Tax Sale.',\n",
" 'license': 'unknown',\n",
" 'title': 'Treasurer - Annual Tax Sale',\n",
" 'topic': 'Treasurer - Annual Tax Sale',\n",
" 'urls': ['https://datacatalog.cookcountyil.gov/Property-Taxation/Treasurer-Annual-Tax-Sale/55ju-2fs9']}\n",
"{'_id': ObjectId('5d84f1142d00ba2e15690ffb'),\n",
" 'description': 'Graph and download economic data for Total '\n",
" 'Amortized Cost of Available-For-Sale '\n",
" 'Securities for Commercial Banks in Arkansas '\n",
" '(ARTACAFSS) from Q1 1994 to Q2 2019 about '\n",
" 'amortization, cost, AR, securities, '\n",
" 'commercial, sales, banks, depository '\n",
" 'institutions, and USA.',\n",
" 'license': 'https://research.stlouisfed.org/fred_terms.html',\n",
" 'title': 'Total Amortized Cost of Available-For-Sale '\n",
" 'Securities for Commercial Banks in Arkansas',\n",
" 'topic': 'Total Amortized Cost of Available-For-Sale '\n",
" 'Securities for Commercial Banks in Arkansas',\n",
" 'urls': ['https://fred.stlouisfed.org/series/ARTACAFSS']}\n",
"{'_id': ObjectId('5d84f1492d00ba2e15690ffe'),\n",
" 'description': 'This dataset shows licences granted to '\n",
" 'individuals to authorise a sale of alcohol.',\n",
" 'license': 'Open Government Licence',\n",
" 'title': 'Personal licences (sale of alcohol)',\n",
" 'topic': 'Personal licences (sale of alcohol)',\n",
" 'urls': ['https://data.gov.uk/dataset/36fe368c-4841-45b7-b6f2-0ba3a9f9ebac/personal-licences-sale-of-alcohol']}\n",
"{'_id': ObjectId('5d84f1b52d00ba2e15691001'),\n",
" 'description': 'The sales price, buyer, and seller of '\n",
" 'properties sold in the City of Detroit.',\n",
" 'license': 'Public Domain',\n",
" 'title': 'Property Sales History',\n",
" 'topic': 'Property Sales History',\n",
" 'urls': ['https://data.detroitmi.gov/Property-Parcels/Property-Sales-History/xbvp-4is5']}\n",
"{'_id': ObjectId('5d84f1f42d00ba2e15691004'),\n",
" 'description': 'This file contains a list of taxpayers who '\n",
" 'hold an active sales tax permit under Tax Code '\n",
" 'Chapter 151, Subchapter F. The file includes '\n",
" 'taxpayer and outlet information.',\n",
" 'license': 'Public Domain',\n",
" 'title': 'Active Sales Tax Permit Holders',\n",
" 'topic': 'Active Sales Tax Permit Holders',\n",
" 'urls': ['https://data.texas.gov/Government-and-Taxes/Active-Sales-Tax-Permit-Holders/jrea-zgmq']}\n",
"{'_id': ObjectId('5d84f22e2d00ba2e15691007'),\n",
" 'description': \"Apple's iPhone sold more than 217 million \"\n",
" 'devices in 2018.',\n",
" 'license': 'unknown',\n",
" 'title': 'Apple iPhone sales worldwide 2007-2018',\n",
" 'topic': 'Apple iPhone sales worldwide 2007-2018',\n",
" 'urls': ['https://www.statista.com/statistics/276306/global-apple-iphone-sales-since-fiscal-year-2007/']}\n",
"{'_id': ObjectId('5d84f2602d00ba2e1569100a'),\n",
" 'description': 'Graph and download economic data for Average '\n",
" 'Sales Price of Houses Sold for the United '\n",
" 'States (ASPUS) from Q1 1963 to Q2 2019 about '\n",
" 'sales, housing, and USA.',\n",
" 'license': 'https://research.stlouisfed.org/fred_terms.html',\n",
" 'title': 'Average Sales Price of Houses Sold for the United '\n",
" 'States',\n",
" 'topic': 'Average Sales Price of Houses Sold for the United '\n",
" 'States',\n",
" 'urls': ['https://fred.stlouisfed.org/series/ASPUS']}\n",
"{'_id': ObjectId('5d84f2932d00ba2e1569100d'),\n",
" 'description': 'The products listed below are under a current '\n",
" 'stop sale, use, or removal order.',\n",
" 'license': 'unknown',\n",
" 'title': 'Fertilizer Program Stop Sales',\n",
" 'topic': 'Fertilizer Program Stop Sales',\n",
" 'urls': ['https://catalog.data.gov/dataset/fertilizer-program-stop-sales-9e74d']}\n",
"{'_id': ObjectId('5d84f2ed2d00ba2e15691010'),\n",
" 'description': 'Apple iPhone unit sales & revenue',\n",
" 'license': 'CC-BY',\n",
" 'title': 'Quarterly sales and revenue for Apple iPhone Q2/07 - '\n",
" 'Q2/16',\n",
" 'topic': 'iPhone Sales',\n",
" 'urls': ['https://data.world/rflprr/iphone-sales']}\n",
"{'_id': ObjectId('5d84f3262d00ba2e15691013'),\n",
" 'description': 'The Mat-Su Borough Land Sale Application has '\n",
" 'been developed as an interactive tool for '\n",
" 'previewing and researching properties '\n",
" 'available through the borough’s different land '\n",
" 'sale programs. ',\n",
" 'license': 'Matanuska Susitna Borough Land Sale and Tax & LID '\n",
" 'Foreclosure Sale Viewer',\n",
" 'title': 'Mat-Su Borough Land Sales',\n",
" 'topic': 'Mat-Su Borough Land Sales',\n",
" 'urls': ['https://data1-msb.opendata.arcgis.com/items/08d489a99ebe447eb87e99f018c96100']}\n"
]
}
],
"source": [
"import pprint\n",
"import pymongo, json\n",
"client = pymongo.MongoClient (host=\"da1.eecs.utk.edu\")\n",
"db = client ['fdac19mp2']\n",
"coll = db ['zyang37']\n",
"pp = pprint.PrettyPrinter(indent=1,width=65)\n",
"for r in coll. find():\n",
" print(pp .pformat (r)) "
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {
"collapsed": true
},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.6.7"
}
},
"nbformat": 4,
"nbformat_minor": 1
}
Loading