diff --git a/topic_extraction.ipynb b/topic_extraction.ipynb
index aef8096..1795510 100644
--- a/topic_extraction.ipynb
+++ b/topic_extraction.ipynb
@@ -16,10 +16,10 @@
},
{
"cell_type": "code",
- "execution_count": 1,
+ "execution_count": 30,
"metadata": {
"id": "gRqJTU_tqNK6",
- "outputId": "834e6fb2-ae3e-4998-abfe-1aa671de77b8",
+ "outputId": "2b263c2e-4bef-4b7d-e5f9-319f8122a4c7",
"colab": {
"base_uri": "https://localhost:8080/"
}
@@ -31,11 +31,8 @@
"text": [
"Requirement already satisfied: nltk in /usr/local/lib/python3.10/dist-packages (3.8.1)\n",
"Requirement already satisfied: pandas in /usr/local/lib/python3.10/dist-packages (2.0.3)\n",
- "Collecting yake\n",
- " Downloading yake-0.4.8-py2.py3-none-any.whl (60 kB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m60.2/60.2 kB\u001b[0m \u001b[31m1.4 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
- "\u001b[?25hCollecting multi_rake\n",
- " Downloading multi_rake-0.0.2-py3-none-any.whl (31 kB)\n",
+ "Requirement already satisfied: yake in /usr/local/lib/python3.10/dist-packages (0.4.8)\n",
+ "Requirement already satisfied: multi_rake in /usr/local/lib/python3.10/dist-packages (0.0.2)\n",
"Requirement already satisfied: wordcloud in /usr/local/lib/python3.10/dist-packages (1.9.3)\n",
"Requirement already satisfied: click in /usr/local/lib/python3.10/dist-packages (from nltk) (8.1.7)\n",
"Requirement already satisfied: joblib in /usr/local/lib/python3.10/dist-packages (from nltk) (1.4.2)\n",
@@ -46,33 +43,20 @@
"Requirement already satisfied: tzdata>=2022.1 in /usr/local/lib/python3.10/dist-packages (from pandas) (2024.1)\n",
"Requirement already satisfied: numpy>=1.21.0 in /usr/local/lib/python3.10/dist-packages (from pandas) (1.25.2)\n",
"Requirement already satisfied: tabulate in /usr/local/lib/python3.10/dist-packages (from yake) (0.9.0)\n",
- "Collecting segtok (from yake)\n",
- " Downloading segtok-1.5.11-py3-none-any.whl (24 kB)\n",
+ "Requirement already satisfied: segtok in /usr/local/lib/python3.10/dist-packages (from yake) (1.5.11)\n",
"Requirement already satisfied: networkx in /usr/local/lib/python3.10/dist-packages (from yake) (3.3)\n",
"Requirement already satisfied: jellyfish in /usr/local/lib/python3.10/dist-packages (from yake) (1.0.4)\n",
- "Collecting pycld2>=0.41 (from multi_rake)\n",
- " Downloading pycld2-0.41.tar.gz (41.4 MB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m41.4/41.4 MB\u001b[0m \u001b[31m11.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
- "\u001b[?25h Preparing metadata (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- "Collecting pyrsistent>=0.14.2 (from multi_rake)\n",
- " Downloading pyrsistent-0.20.0-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (117 kB)\n",
- "\u001b[2K \u001b[90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\u001b[0m \u001b[32m117.7/117.7 kB\u001b[0m \u001b[31m4.5 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
- "\u001b[?25hRequirement already satisfied: pillow in /usr/local/lib/python3.10/dist-packages (from wordcloud) (9.4.0)\n",
+ "Requirement already satisfied: pycld2>=0.41 in /usr/local/lib/python3.10/dist-packages (from multi_rake) (0.41)\n",
+ "Requirement already satisfied: pyrsistent>=0.14.2 in /usr/local/lib/python3.10/dist-packages (from multi_rake) (0.20.0)\n",
+ "Requirement already satisfied: pillow in /usr/local/lib/python3.10/dist-packages (from wordcloud) (9.4.0)\n",
"Requirement already satisfied: matplotlib in /usr/local/lib/python3.10/dist-packages (from wordcloud) (3.7.1)\n",
"Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.10/dist-packages (from python-dateutil>=2.8.2->pandas) (1.16.0)\n",
"Requirement already satisfied: contourpy>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->wordcloud) (1.2.1)\n",
"Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.10/dist-packages (from matplotlib->wordcloud) (0.12.1)\n",
"Requirement already satisfied: fonttools>=4.22.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib->wordcloud) (4.53.0)\n",
"Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->wordcloud) (1.4.5)\n",
- "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib->wordcloud) (24.0)\n",
- "Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->wordcloud) (3.1.2)\n",
- "Building wheels for collected packages: pycld2\n",
- " Building wheel for pycld2 (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- " Created wheel for pycld2: filename=pycld2-0.41-cp310-cp310-linux_x86_64.whl size=9904033 sha256=f74226f1f7893878e76b82783d819c22b4f97d5293e2ebaaf90c8e0cd67dd4ea\n",
- " Stored in directory: /root/.cache/pip/wheels/be/81/31/240c89c845e008a93d98542325270007de595bfd356eb0b06c\n",
- "Successfully built pycld2\n",
- "Installing collected packages: pycld2, segtok, pyrsistent, yake, multi_rake\n",
- "Successfully installed multi_rake-0.0.2 pycld2-0.41 pyrsistent-0.20.0 segtok-1.5.11 yake-0.4.8\n"
+ "Requirement already satisfied: packaging>=20.0 in /usr/local/lib/python3.10/dist-packages (from matplotlib->wordcloud) (24.1)\n",
+ "Requirement already satisfied: pyparsing>=2.3.1 in /usr/local/lib/python3.10/dist-packages (from matplotlib->wordcloud) (3.1.2)\n"
]
}
],
@@ -101,49 +85,49 @@
"metadata": {
"id": "5DKM4Sc6szWm"
},
- "execution_count": 2,
+ "execution_count": 31,
"outputs": []
},
{
"cell_type": "code",
- "execution_count": 3,
+ "execution_count": 32,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 696
+ "height": 609
},
"id": "Qz4VKs-fPT1V",
- "outputId": "04e49566-d8ba-4584-bde7-cead78d5e748"
+ "outputId": "3bec58ea-712d-4a92-c3e8-e4535b5df1d4"
},
"outputs": [
{
"output_type": "stream",
"name": "stdout",
"text": [
- "(1974, 29)\n"
+ "(1993, 30)\n"
]
},
{
"output_type": "execute_result",
"data": {
"text/plain": [
- " id name description url last_synced_at repository owner packages commits issues_stats events keywords dependencies score created_at updated_at avatar_url language category sub_category monthly_downloads readme funding_links readme_doi_urls works citation_counts total_citations project_url \\\n",
- "0 73419 Py-ART A data model driven interactive toolkit for wo... https://github.com/arm-doe/pyart 2024-06-12 10:01:09.870000+00:00 {'id': 5086348, 'uuid': '6248645', 'full_name'... {'login': 'ARM-DOE', 'name': 'ARM User Facilit... [{'id': 5413461, 'name': 'py-arm-pyart', 'ecos... {'full_name': 'ARM-DOE/pyart', 'default_branch... {'full_name': 'ARM-DOE/pyart', 'html_url': 'ht... None [closember, data-visualization, hacktoberfest,... [{'ecosystem': 'pypi', 'filepath': 'requiremen... 21.013420 2023-09-18 13:18:27.404000+00:00 2024-06-12 10:01:09.901000+00:00 https://github.com/ARM-DOE.png Python Atmosphere Meteorological Observation and Forecast 27001 .. -*- mode: rst -*-\\nThe Python ARM Radar Too... [] [http://doi.org/10.5334/jors.119] {} {} 0 https://ost.ecosyste.ms/api/v1/projects/73419 \n",
- "1 193296 PARETO An Optimization Framework for Produced Water M... https://github.com/project-pareto/project-pareto 2024-06-12 09:30:42.493000+00:00 {'id': 37539257, 'uuid': '375089252', 'full_na... {'login': 'project-pareto', 'name': 'project-p... [] {'full_name': 'project-pareto/project-pareto',... {'full_name': 'project-pareto/project-pareto',... {'total': {'ForkEvent': 23, 'CreateEvent': 26,... [pse] [{'ecosystem': 'actions', 'filepath': '.github... 7.404279 2024-05-24 00:14:46.717000+00:00 2024-06-12 09:30:42.496000+00:00 https://github.com/project-pareto.png Python Natural Resources Water Supply 0 \\n[![All Contributors](https://img.shields.io/badge/all_contributors-54-orange.svg?style=flat-square)](#contributors-)\\n\\n\\n# PlantCV: Plant phenotyping using computer vision\\n\\nPlease use, cite, and [contribute to](http://plantcv.readthedocs.io/en/latest/CONTRIBUTING/) PlantCV!\\nIf you have questions, please submit them via the\\n[GitHub issues page](https://github.com/danforthcenter/plantcv/issues).\\nFollow us on twitter [@plantcv](https://twitter.com/plantcv).\\n\\n***\\n\\n## Introduction to PlantCV\\n\\nPlantCV is an open-source image analysis software package targeted for plant phenotyping. PlantCV provides a common\\nprogramming and documentation interface to a collection of image analysis techniques that are integrated from a variety\\nof source packages and algorithms. PlantCV utilizes a modular architecture that enables flexibility in the design of\\nanalysis workflows and rapid assimilation and integration of new methods. For more information about the project,\\nlinks to recorded presentations, and publications using PlantCV, please visit our homepage: \\n
conda create -n rivgraph_env rivgraph -c conda-forge\\nconda activate rivgraph_env\\n
\\n\\nYou may then want to install Spyder or your preferred IDE. Conda should fetch all the required dependencies and handle versioning.\\n\\nIf you want to install RivGraph into an already-existing environment, you can run conda activate myenv\\nconda install rivgraph -c conda-forge
\\n\\nYou may also [install RivGraph from this Github repo](https://VeinsOfTheEarth.github.io/RivGraph/install/index.html#installation-from-source).\\n\\nInstructions for testing your installation are available [here](https://VeinsOfTheEarth.github.io/RivGraph/install/index.html#installation-from-source).\\n\\nHow to use?\\n-----\\n\\nPlease see the [documentation](https://VeinsOfTheEarth.github.io/RivGraph/) for more detailed instructions.\\n\\nRivGraph requires that you provide a binary mask of your network. [This page](https://VeinsOfTheEarth.github.io/RivGraph/maskmaking/index.html) provides some help, hints, and tools for finding or creating your mask.\\n\\nTo see what RivGraph does and how to operate it, you can work through the [Colville Delta example](https://github.com/VeinsOfTheEarth/RivGraph/blob/master/examples/delta_example.ipynb) or the [Brahmaputra River example](https://github.com/VeinsOfTheEarth/RivGraph/blob/master/examples/braided_river_example.ipynb). Both examples include sample masks.\\n\\nRivGraph contains two primary classes (`delta` and `river`) that provide convenient methods for creating a processing workflow for a channel network. As the examples demonstrate, you can instantiate a delta or river class, then apply associated methods for each. After looking at the examples, take a look at [classes.py](https://github.com/VeinsOfTheEarth/RivGraph/blob/master/rivgraph/classes.py) to understand what methods are available.\\n\\n**Note**: there are many functions under the hood that may be useful to you. Check out the [im_utils script](https://github.com/VeinsOfTheEarth/RivGraph/blob/master/rivgraph/im_utils.py) (image utilities) in particular for functions to help whip your mask into shape!\\n\\nContributing\\n------------\\n\\nIf you think you're not skilled or experienced enough to contribute, think again! 
We agree wholeheartedly with the sentiments expressed by this [Imposter syndrome disclaimer](https://github.com/Unidata/MetPy#contributing). We welcome all forms of user contributions including feature requests, bug reports, code, documentation requests, and code. Simply open an issue in the [tracker](https://github.com/VeinsOfTheEarth/RivGraph/issues). For code development contributions, please contact us via email to be added to our slack channel where we can hash out a plan for your contribution.\\n\\nCiting RivGraph\\n------------\\n\\nCitations help us justify the effort that goes into building and maintaining this project. If you used RivGraph for your research, please consider citing us.\\n\\nIf you use RivGraph's flow directionality algorithms, please cite our [ESurf Dynamics paper](https://www.earth-surf-dynam.net/8/87/2020/esurf-8-87-2020.html). Additionally, if you publish work wherein RivGraph was used to process your data, please cite our [JOSS Paper](https://joss.theoj.org/papers/10.21105/joss.02952).\\n\\nContacting us\\n-------------\\n\\nThe best way to get in touch is to [open an issue](https://github.com/VeinsOfTheEarth/rivgraph/issues/new) or comment on any open issue or pull request. Otherwise, send an email to j.........k@gmail.com\\n\\nLicense\\n------------\\n\\nThis is free software: you can redistribute it and/or modify it under the terms of the **BSD 3-clause License**. A copy of this license is provided in [LICENSE.txt](https://github.com/VeinsOfTheEarth/RivGraph/blob/master/LICENSE.txt).\\n\\nRivGraph has been assigned number C19049 by the Feynman Center for Innovation.\\n\"\n ],\n \"semantic_type\": \"\",\n \"description\": \"\"\n }\n }\n ]\n}"
}
},
"metadata": {},
- "execution_count": 16
+ "execution_count": 45
}
],
"source": [
- "df['combined'] = combined\n",
+ "# Combine the text columns into one document per project (previously 'combined' held only the description)\n",
+ "cols_to_combine = ['name', 'description', 'category', 'sub_category', 'readme']\n",
+ "df['combined'] = df[cols_to_combine].fillna('').astype(str).agg(' '.join, axis=1)  # NaN -> '' so join cannot fail\n",
"df.head()"
]
},
{
"cell_type": "code",
- "execution_count": 17,
+ "execution_count": 46,
+ "metadata": {
+ "id": "hCI6xTP5aZmv",
+ "collapsed": true
+ },
+ "outputs": [],
+ "source": [
+ "# df['combined'] = combined\n",
+ "# df.head()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 47,
"metadata": {
"id": "7OXAWga1a8Vv"
},
@@ -1624,7 +1655,7 @@
"metadata": {
"id": "ZoBvEVbz0ezW"
},
- "execution_count": 18,
+ "execution_count": 48,
"outputs": []
},
{
@@ -1637,9 +1668,9 @@
"base_uri": "https://localhost:8080/"
},
"id": "aKWZZ3jdE4Kv",
- "outputId": "a765f421-4642-428f-917f-a2b32b7470d6"
+ "outputId": "ebe67d4b-362d-46c0-81ec-7f3734a98601"
},
- "execution_count": 19,
+ "execution_count": 49,
"outputs": [
{
"output_type": "execute_result",
@@ -1649,7 +1680,7 @@
]
},
"metadata": {},
- "execution_count": 19
+ "execution_count": 49
}
]
},
@@ -1681,16 +1712,42 @@
"metadata": {
"id": "cOLRb0Gjo6K3"
},
- "execution_count": 20,
+ "execution_count": 50,
"outputs": []
},
{
"cell_type": "code",
- "execution_count": 21,
+ "execution_count": 51,
"metadata": {
- "id": "sAX050Xnanob"
+ "id": "sAX050Xnanob",
+ "outputId": "b53ce89d-2551-4f85-ca25-55ba6bbbf71f",
+ "colab": {
+ "base_uri": "https://localhost:8080/"
+ }
},
- "outputs": [],
+ "outputs": [
+ {
+ "output_type": "execute_result",
+ "data": {
+ "text/plain": [
+ "0 cmocean colormap standardizing plotting oceano...\n",
+ "1 traptagger powered camera trap biosphere terre...\n",
+ "2 opem proton membrane fuel energy storage hydro...\n",
+ "3 climlab climate climate earth climate climlab ...\n",
+ "4 fine optimizing energy energy energy ethos fin...\n",
+ " ... \n",
+ "1988 soil freeze thaw soil freeze thaw transport he...\n",
+ "1989 polaris infrastructure cases ocean land exasca...\n",
+ "1990 spacelidar icesat icesat gedi filtered attribu...\n",
+ "1991 flood flood inundation caused tsunami river ra...\n",
+ "1992 goestools signals goes satellites sustainable ...\n",
+ "Name: cleaned_text, Length: 1993, dtype: object"
+ ]
+ },
+ "metadata": {},
+ "execution_count": 51
+ }
+ ],
"source": [
"# Create new column called \"cleaned_text\" and apply different cleaning methods\n",
"df['cleaned_text'] = df['combined'].apply(lambda x: x.replace(\"\\\\n\", \" \")) # Replace \\\\n\n",
@@ -1701,44 +1758,260 @@
"df['cleaned_text'] = df['cleaned_text'].apply(lambda x: ' '.join(x for x in str(x).split() if x.isalpha())) # Remove numbers\n",
"df['cleaned_text'] = df['cleaned_text'].apply(lambda x: ' '.join(x for x in str(x).split() if x not in words_black_list_large)) # Remove words from blacklist\n",
"df['cleaned_text'] = df['cleaned_text'].apply(lambda x: ' '.join(x for x in str(x).split() if x not in stpwords)) # Remove stopwords\n",
- "\n"
+ "\n",
+ "df['cleaned_text']"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 51,
+ "metadata": {
+ "id": "2gqZo79tboxy"
+ },
+ "outputs": [],
+ "source": []
+ },
+ {
+ "cell_type": "markdown",
+ "source": [
+ "# 3.1 Try new Energy Systems subcategories"
+ ],
+ "metadata": {
+ "id": "cQU9awF2zbhY"
+ }
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# REMARK (Michael): this cell uses a different approach from the cleaning above and preprocesses the full 'combined' text again\n",
+ "# (see the `df['cleand_text_michael'] = ...` line below). With this approach the fallback sub-category 'Other' is assigned only 30 times,\n",
+ "# whereas with the 'cleaned_text' column from above it is assigned 98 times. I have not investigated further and have no good intuition yet for why this happens.\n",
+ "\n",
+ "from collections import Counter\n",
+ "\n",
+ "# Keyword lists (all lowercase) for the expanded set of Energy Systems sub-categories\n",
+ "new_energy_subcategories = {\n",
+ " 'Solar Energy': ['photovoltaic', 'solar', 'pv', 'csp', 'concentrated solar power', 'solar thermal', 'solar cell', 'solar panel', 'solar energy'],\n",
+ " 'Wind Energy': ['wind', 'onshore wind', 'offshore wind', 'wind turbine', 'wind farm', 'wind power'],\n",
+ " 'Energy Storage': ['battery', 'storage', 'pumped hydro', 'thermal storage', 'hydrogen storage', 'energy storage', 'lithium-ion', 'flywheel', 'capacitor'],\n",
+ " 'Grid Systems': ['grid', 'smart grid', 'microgrid', 'power distribution', 'electricity network', 'transmission', 'power system'],\n",
+ " 'Energy Efficiency': ['efficiency', 'building energy', 'industrial energy', 'audit', 'energy saving', 'insulation', 'led lighting', 'heat recovery'],\n",
+ " 'Hydroelectric Power': ['hydro', 'hydroelectric', 'run-of-river', 'dam', 'water turbine', 'hydropower'],\n",
+ " 'Geothermal Energy': ['geothermal', 'ground source heat', 'geothermal power', 'earth energy'],\n",
+ " 'Bioenergy': ['biomass', 'biofuel', 'biogas', 'biodiesel', 'ethanol', 'anaerobic digestion'],\n",
+ " 'Hydrogen and Fuel Cells': ['hydrogen', 'fuel cell', 'electrolyzer', 'h2 production', 'hydrogen storage'],\n",
+ " 'Energy System Integration': ['hybrid energy', 'sector coupling', 'system modeling', 'energy system', 'integrated energy', 'multi-energy system'],\n",
+ " 'Energy Markets and Economics': ['energy trading', 'price forecasting', 'energy policy', 'energy market', 'electricity price', 'energy economics'],\n",
+ " 'Emerging Energy Technologies': ['ocean energy', 'tidal', 'wave energy', 'advanced nuclear', 'fusion', 'small modular reactor', 'marine energy'],\n",
+ " 'Energy Data and Analytics': ['energy data', 'energy analytics', 'energy monitoring', 'smart meter', 'energy management system', 'energy forecasting'],\n",
+ " 'Electric Vehicles and Mobility': ['electric vehicle', 'ev charging', 'e-mobility', 'vehicle-to-grid', 'sustainable transport'],\n",
+ " 'Carbon Capture and Storage': ['carbon capture', 'ccs', 'carbon sequestration', 'co2 storage', 'greenhouse gas reduction']\n",
+ "}\n",
+ "\n",
+ "# initialize lemmatizer\n",
+ "lemmatizer = WordNetLemmatizer()\n",
+ "\n",
+ "# Preprocess text\n",
+ "def preprocess_text(text):\n",
+ "    \"\"\"Lowercase `text`, replace non-alphanumeric characters with spaces, drop English stopwords and lemmatize; NaN gives ''.\"\"\"\n",
+ "    if pd.isna(text):\n",
+ "        return \"\"\n",
+ "    # Build the stopword set once per call instead of fetching the whole list again for every token\n",
+ "    english_stopwords = set(stopwords.words('english'))\n",
+ "    # Keep only letters, digits and whitespace (punctuation such as '-' becomes a space)\n",
+ "    text = re.sub(r'[^a-zA-Z0-9\\s]', ' ', text.lower())\n",
+ "    tokens = [\n",
+ "        lemmatizer.lemmatize(word)  # uses the module-level WordNetLemmatizer\n",
+ "        for word in word_tokenize(text)\n",
+ "        if word not in english_stopwords\n",
+ "    ]\n",
+ "    return ' '.join(tokens)\n",
+ "\n",
+ "# Function to assign a single new sub-category\n",
+ "def assign_single_subcategory(text):\n",
+ "    \"\"\"Return the sub-category whose keywords occur most often in `text` (first listed wins ties), or 'Other' if none occur.\"\"\"\n",
+ "    text = preprocess_text(text)\n",
+ "    category_scores = {}\n",
+ "    for category, keywords in new_energy_subcategories.items():\n",
+ "        # Clean the keywords the same way as the text: preprocess_text replaces '-' with a space and drops\n",
+ "        # stopwords, so a raw keyword such as 'lithium-ion' could never occur in the cleaned text.\n",
+ "        cleaned_keywords = [kw for kw in map(preprocess_text, keywords) if kw]  # skip keywords that clean to ''\n",
+ "        # str.count matches substrings, so short keywords (e.g. 'pv', 'dam') also count inside longer words\n",
+ "        category_scores[category] = sum(text.count(kw) for kw in cleaned_keywords)\n",
+ "    best_category = max(category_scores, key=category_scores.get)  # first category with the highest score\n",
+ "    return best_category if category_scores[best_category] > 0 else 'Other'\n",
+ "\n",
+ "# Clean the combined text once and store it in its own column\n",
+ "df['cleand_text_michael'] = df['combined'].apply(preprocess_text)\n",
+ "\n",
+ "# Classify only 'Energy Systems' projects; every other row gets the fixed label 'Not an Energy System'\n",
+ "df['new_energy_subcategory'] = [assign_single_subcategory(text) if category == 'Energy Systems' else 'Not an Energy System' for text, category in zip(df['cleand_text_michael'], df['category'])]\n",
+ "\n",
+ "# Count how many 'Energy Systems' projects landed in each new sub-category\n",
+ "energy_subcategory_distribution = df.loc[df['category'] == 'Energy Systems', 'new_energy_subcategory'].value_counts()\n",
+ "\n",
+ "print(\"Distribution of new Energy Systems sub-categories:\")\n",
+ "print(energy_subcategory_distribution)"
+ ],
+ "metadata": {
+ "id": "KgAFIdqhzXqM",
+ "outputId": "ade63f4c-5804-41f5-b331-ceb027f19d35",
+ "colab": {
+ "base_uri": "https://localhost:8080/"
+ }
+ },
+ "execution_count": 52,
+ "outputs": [
+ {
+ "output_type": "stream",
+ "name": "stdout",
+ "text": [
+ "Distribution of new Energy Systems sub-categories:\n",
+ "new_energy_subcategory\n",
+ "Grid Systems 76\n",
+ "Energy System Integration 54\n",
+ "Wind Energy 23\n",
+ "Energy Storage 18\n",
+ "Solar Energy 13\n",
+ "Energy Data and Analytics 10\n",
+ "Hydroelectric Power 7\n",
+ "Energy Efficiency 4\n",
+ "Energy Markets and Economics 3\n",
+ "Name: count, dtype: int64\n"
+ ]
+ }
+ ]
+ },
+ {
+ "cell_type": "code",
+ "source": [
+ "# Bar chart of how many 'Energy Systems' projects fall into each new sub-category\n",
+ "import matplotlib.pyplot as plt\n",
+ "\n",
+ "fig, ax = plt.subplots(figsize=(12, 6))\n",
+ "energy_subcategory_distribution.plot(kind='bar', ax=ax)\n",
+ "ax.set_title('Distribution of New Energy Systems Sub-Categories')\n",
+ "ax.set_xlabel('Sub-Category')\n",
+ "ax.set_ylabel('Number of Projects')\n",
+ "plt.setp(ax.get_xticklabels(), rotation=45, ha='right')\n",
+ "fig.tight_layout()\n",
+ "plt.show()"
+ ],
+ "metadata": {
+ "id": "9yNm2GmEZT6q",
+ "outputId": "6527de91-681c-4fdb-bbde-73da21b96bd5",
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 607
+ }
+ },
+ "execution_count": 53,
+ "outputs": [
+ {
+ "output_type": "display_data",
+ "data": {
+ "text/plain": [
+ "pandas.core.frame.DataFrame
def __init__(data=None, index: Axes | None=None, columns: Axes | None=None, dtype: Dtype | None=None, copy: bool | None=None) -> None
\n", - " \n", - " Two-dimensional, size-mutable, potentially heterogeneous tabular data.\n", - "\n", - "Data structure also contains labeled axes (rows and columns).\n", - "Arithmetic operations align on both row and column labels. Can be\n", - "thought of as a dict-like container for Series objects. The primary\n", - "pandas data structure.\n", - "\n", - "Parameters\n", - "----------\n", - "data : ndarray (structured or homogeneous), Iterable, dict, or DataFrame\n", - " Dict can contain Series, arrays, constants, dataclass or list-like objects. If\n", - " data is a dict, column order follows insertion-order. If a dict contains Series\n", - " which have an index defined, it is aligned by its index. This alignment also\n", - " occurs if data is a Series or a DataFrame itself. Alignment is done on\n", - " Series/DataFrame inputs.\n", - "\n", - " If data is a list of dicts, column order follows insertion-order.\n", - "\n", - "index : Index or array-like\n", - " Index to use for resulting frame. Will default to RangeIndex if\n", - " no indexing information part of input data and no index provided.\n", - "columns : Index or array-like\n", - " Column labels to use for resulting frame when data does not have them,\n", - " defaulting to RangeIndex(0, 1, 2, ..., n). If data contains column labels,\n", - " will perform column selection instead.\n", - "dtype : dtype, default None\n", - " Data type to force. Only a single dtype is allowed. If None, infer.\n", - "copy : bool or None, default None\n", - " Copy data from inputs.\n", - " For dict data, the default of None behaves like ``copy=True``. For DataFrame\n", - " or 2d ndarray input, the default of None behaves like ``copy=False``.\n", - " If data is a dict containing one or more Series (possibly of different dtypes),\n", - " ``copy=False`` will ensure that these inputs are not copied.\n", - "\n", - " .. 
versionchanged:: 1.3.0\n", - "\n", - "See Also\n", - "--------\n", - "DataFrame.from_records : Constructor from tuples, also record arrays.\n", - "DataFrame.from_dict : From dicts of Series, arrays, or dicts.\n", - "read_csv : Read a comma-separated values (csv) file into DataFrame.\n", - "read_table : Read general delimited file into DataFrame.\n", - "read_clipboard : Read text from clipboard into DataFrame.\n", - "\n", - "Notes\n", - "-----\n", - "Please reference the :ref:`User Guide <basics.dataframe>` for more information.\n", - "\n", - "Examples\n", - "--------\n", - "Constructing DataFrame from a dictionary.\n", - "\n", - ">>> d = {'col1': [1, 2], 'col2': [3, 4]}\n", - ">>> df = pd.DataFrame(data=d)\n", - ">>> df\n", - " col1 col2\n", - "0 1 3\n", - "1 2 4\n", - "\n", - "Notice that the inferred dtype is int64.\n", - "\n", - ">>> df.dtypes\n", - "col1 int64\n", - "col2 int64\n", - "dtype: object\n", - "\n", - "To enforce a single dtype:\n", - "\n", - ">>> df = pd.DataFrame(data=d, dtype=np.int8)\n", - ">>> df.dtypes\n", - "col1 int8\n", - "col2 int8\n", - "dtype: object\n", - "\n", - "Constructing DataFrame from a dictionary including Series:\n", - "\n", - ">>> d = {'col1': [0, 1, 2, 3], 'col2': pd.Series([2, 3], index=[2, 3])}\n", - ">>> pd.DataFrame(data=d, index=[0, 1, 2, 3])\n", - " col1 col2\n", - "0 0 NaN\n", - "1 1 NaN\n", - "2 2 2.0\n", - "3 3 3.0\n", - "\n", - "Constructing DataFrame from numpy ndarray:\n", - "\n", - ">>> df2 = pd.DataFrame(np.array([[1, 2, 3], [4, 5, 6], [7, 8, 9]]),\n", - "... columns=['a', 'b', 'c'])\n", - ">>> df2\n", - " a b c\n", - "0 1 2 3\n", - "1 4 5 6\n", - "2 7 8 9\n", - "\n", - "Constructing DataFrame from a numpy ndarray that has labeled columns:\n", - "\n", - ">>> data = np.array([(1, 2, 3), (4, 5, 6), (7, 8, 9)],\n", - "... 
dtype=[("a", "i4"), ("b", "i4"), ("c", "i4")])\n", - ">>> df3 = pd.DataFrame(data, columns=['c', 'a'])\n", - "...\n", - ">>> df3\n", - " c a\n", - "0 3 1\n", - "1 6 4\n", - "2 9 7\n", - "\n", - "Constructing DataFrame from dataclass:\n", - "\n", - ">>> from dataclasses import make_dataclass\n", - ">>> Point = make_dataclass("Point", [("x", int), ("y", int)])\n", - ">>> pd.DataFrame([Point(0, 0), Point(0, 3), Point(2, 3)])\n", - " x y\n", - "0 0 0\n", - "1 0 3\n", - "2 2 3\n", - "\n", - "Constructing DataFrame from Series/DataFrame:\n", - "\n", - ">>> ser = pd.Series([1, 2, 3], index=["a", "b", "c"])\n", - ">>> df = pd.DataFrame(data=ser, index=["a", "c"])\n", - ">>> df\n", - " 0\n", - "a 1\n", - "c 3\n", - "\n", - ">>> df1 = pd.DataFrame([1, 2, 3], index=["a", "b", "c"], columns=["x"])\n", - ">>> df2 = pd.DataFrame(data=df1, index=["a", "c"])\n", - ">>> df2\n", - " x\n", - "a 1\n", - "c 3
\n", - " | count | \n", - "
---|---|
(time, series) | \n", - "35 | \n", - "
(climate, change) | \n", - "34 | \n", - "
(machine, learning) | \n", - "30 | \n", - "
(energy, systems) | \n", - "30 | \n", - "
(real, time) | \n", - "25 | \n", - "
(power, system) | \n", - "25 | \n", - "
(earth, system) | \n", - "25 | \n", - "
(energy, system) | \n", - "23 | \n", - "
(energy, consumption) | \n", - "20 | \n", - "
(deep, learning) | \n", - "19 | \n", - "
(remote, sensing) | \n", - "19 | \n", - "
(power, systems) | \n", - "18 | \n", - "
(water, quality) | \n", - "18 | \n", - "
(renewable, energy) | \n", - "16 | \n", - "
(life, cycle) | \n", - "15 | \n", - "
(radiative, transfer) | \n", - "14 | \n", - "
(high, resolution) | \n", - "14 | \n", - "
(weather, climate) | \n", - "12 | \n", - "
(large, scale) | \n", - "12 | \n", - "
(long, term) | \n", - "12 | \n", - "
(curated, list) | \n", - "11 | \n", - "
(high, performance) | \n", - "11 | \n", - "
(integrated, assessment) | \n", - "11 | \n", - "
(around, world) | \n", - "11 | \n", - "
(surface, water) | \n", - "11 | \n", - "
(modeling, system) | \n", - "10 | \n", - "
(sustainable, development) | \n", - "10 | \n", - "
(carbon, footprint) | \n", - "10 | \n", - "
(earth, science) | \n", - "10 | \n", - "
(wind, energy) | \n", - "10 | \n", - "
(modeling, framework) | \n", - "10 | \n", - "
(earth, engine) | \n", - "9 | \n", - "
(energy, efficiency) | \n", - "9 | \n", - "
(building, energy) | \n", - "9 | \n", - "
(species, distribution) | \n", - "9 | \n", - "
(power, plants) | \n", - "9 | \n", - "
(aims, provide) | \n", - "9 | \n", - "
(system, models) | \n", - "9 | \n", - "
(earth, observation) | \n", - "9 | \n", - "
(input, output) | \n", - "9 | \n", - "
(cycle, assessment) | \n", - "9 | \n", - "
(carbon, emissions) | \n", - "9 | \n", - "
(system, modeling) | \n", - "9 | \n", - "
(point, clouds) | \n", - "8 | \n", - "
(google, earth) | \n", - "8 | \n", - "
(electric, vehicle) | \n", - "8 | \n", - "
(wind, turbine) | \n", - "8 | \n", - "
(united, states) | \n", - "8 | \n", - "
(british, columbia) | \n", - "8 | \n", - "
(decision, support) | \n", - "8 | \n", - "
(reinforcement, learning) | \n", - "8 | \n", - "
(greenhouse, emissions) | \n", - "8 | \n", - "
(wind, farm) | \n", - "8 | \n", - "
(electricity, market) | \n", - "7 | \n", - "
(agent, based) | \n", - "7 | \n", - "
(wind, turbines) | \n", - "7 | \n", - "
(climate, weather) | \n", - "7 | \n", - "
(distribution, models) | \n", - "7 | \n", - "
(command, line) | \n", - "7 | \n", - "
(energy, storage) | \n", - "7 | \n", - "
(simulation, program) | \n", - "7 | \n", - "
(community, driven) | \n", - "7 | \n", - "
(land, surface) | \n", - "7 | \n", - "
(multi, scale) | \n", - "7 | \n", - "
(satellite, imagery) | \n", - "7 | \n", - "
(development, goals) | \n", - "7 | \n", - "
(power, flow) | \n", - "7 | \n", - "
(numerical, weather) | \n", - "7 | \n", - "
(greenhouse, gases) | \n", - "7 | \n", - "
(neural, network) | \n", - "7 | \n", - "
(monte, carlo) | \n", - "6 | \n", - "
(energy, management) | \n", - "6 | \n", - "
(solar, energy) | \n", - "6 | \n", - "
(soil, moisture) | \n", - "6 | \n", - "
(energy, resources) | \n", - "6 | \n", - "
(learning, models) | \n", - "6 | \n", - "
(climate, science) | \n", - "6 | \n", - "
(biodiversity, information) | \n", - "6 | \n", - "
(water, balance) | \n", - "6 | \n", - "
(modeling, simulation) | \n", - "6 | \n", - "
(artificial, intelligence) | \n", - "6 | \n", - "
(carbon, intensity) | \n", - "6 | \n", - "
(satellite, images) | \n", - "6 | \n", - "
(climate, models) | \n", - "6 | \n", - "
(carbon, cycle) | \n", - "6 | \n", - "
(environmental, impacts) | \n", - "6 | \n", - "
(provides, access) | \n", - "6 | \n", - "
(provides, tools) | \n", - "6 | \n", - "
(soil, water) | \n", - "6 | \n", - "
(provides, functions) | \n", - "6 | \n", - "
(simulation, models) | \n", - "6 | \n", - "
(solar, cells) | \n", - "6 | \n", - "
(distributed, energy) | \n", - "5 | \n", - "
(land, cover) | \n", - "5 | \n", - "
(citizen, science) | \n", - "5 | \n", - "
(modelica, library) | \n", - "5 | \n", - "
(three, dimensional) | \n", - "5 | \n", - "
(post, processing) | \n", - "5 | \n", - "
(energy, information) | \n", - "5 | \n", - "
(capacity, expansion) | \n", - "5 | \n", - "
(simulation, tool) | \n", - "5 | \n", - "
(quality, control) | \n", - "5 | \n", - "
(weather, prediction) | \n", - "5 | \n", - "
(circular, economy) | \n", - "5 | \n", - "
(process, based) | \n", - "5 | \n", - "
(energy, sector) | \n", - "5 | \n", - "
(atmospheric, science) | \n", - "5 | \n", - "
(water, resources) | \n", - "5 | \n", - "
(widely, used) | \n", - "5 | \n", - "
(land, land) | \n", - "5 | \n", - "
(system, analysis) | \n", - "5 | \n", - "
(power, consumption) | \n", - "5 | \n", - "
(environmental, impact) | \n", - "5 | \n", - "
(information, system) | \n", - "5 | \n", - "
(easy, access) | \n", - "5 | \n", - "
(impact, climate) | \n", - "5 | \n", - "
(offshore, wind) | \n", - "5 | \n", - "
(computer, vision) | \n", - "5 | \n", - "
(decision, making) | \n", - "5 | \n", - "
(free, software) | \n", - "5 | \n", - "
(optimization, tool) | \n", - "5 | \n", - "
(finite, volume) | \n", - "5 | \n", - "
(urban, energy) | \n", - "5 | \n", - "
(software, tools) | \n", - "5 | \n", - "
(provides, easy) | \n", - "5 | \n", - "
(designed, help) | \n", - "4 | \n", - "
(individual, tree) | \n", - "4 | \n", - "
(based, optimization) | \n", - "4 | \n", - "
(remotely, sensed) | \n", - "4 | \n", - "
(learning, tools) | \n", - "4 | \n", - "
(visualization, analysis) | \n", - "4 | \n", - "
(energy, balance) | \n", - "4 | \n", - "
(analysis, framework) | \n", - "4 | \n", - "
(object, oriented) | \n", - "4 | \n", - "
(public, transport) | \n", - "4 | \n", - "
(power, grid) | \n", - "4 | \n", - "
(cloud, microphysics) | \n", - "4 | \n", - "
(information, administration) | \n", - "4 | \n", - "
(iucn, list) | \n", - "4 | \n", - "
(climate, system) | \n", - "4 | \n", - "
(eddy, simulation) | \n", - "4 | \n", - "
(information, facility) | \n", - "4 | \n", - "
(tools, working) | \n", - "4 | \n", - "
(utility, scale) | \n", - "4 | \n", - "
(stock, assessment) | \n", - "4 | \n", - "
(electricity, system) | \n", - "4 | \n", - "
(analysis, platform) | \n", - "4 | \n", - "
(energy, generation) | \n", - "4 | \n", - "
(electricity, generation) | \n", - "4 | \n", - "
(energy, policy) | \n", - "4 | \n", - "
(detection, airborne) | \n", - "4 | \n", - "
(environmental, economic) | \n", - "4 | \n", - "
(benchmark, dataset) | \n", - "4 | \n", - "
(balance, system) | \n", - "4 | \n", - "
(weather, radar) | \n", - "4 | \n", - "
(wind, farms) | \n", - "4 | \n", - "
(forest, carbon) | \n", - "4 | \n", - "
(hydrological, models) | \n", - "4 | \n", - "
(electric, vehicles) | \n", - "4 | \n", - "
(global, weather) | \n", - "4 | \n", - "
(decision, makers) | \n", - "4 | \n", - "
(fisheries, stock) | \n", - "4 | \n", - "
(climate, carbon) | \n", - "4 | \n", - "
(heating, cooling) | \n", - "4 | \n", - "
(global, climate) | \n", - "4 | \n", - "
(simulation, optimization) | \n", - "4 | \n", - "
(battery, models) | \n", - "4 | \n", - "
(download, process) | \n", - "4 | \n", - "
(water, flow) | \n", - "4 | \n", - "
(atmospheric, oceanic) | \n", - "4 | \n", - "
(wind, solar) | \n", - "4 | \n", - "
(short, term) | \n", - "4 | \n", - "
(coastal, ocean) | \n", - "4 | \n", - "
(analysis, visualization) | \n", - "4 | \n", - "
(climate, analysis) | \n", - "4 | \n", - "
(statistical, downscaling) | \n", - "4 | \n", - "
(list, awesome) | \n", - "4 | \n", - "
(climate, policy) | \n", - "4 | \n", - "
(tool, developed) | \n", - "4 | \n", - "
(whole, building) | \n", - "4 | \n", - "
(collection, tools) | \n", - "4 | \n", - "
(surface, temperature) | \n", - "4 | \n", - "
(tools, processing) | \n", - "4 | \n", - "
(modeling, tool) | \n", - "4 | \n", - "
(systems, modeling) | \n", - "4 | \n", - "
(residential, buildings) | \n", - "4 | \n", - "
(wide, range) | \n", - "4 | \n", - "
(analysis, tool) | \n", - "4 | \n", - "
(energy, usage) | \n", - "4 | \n", - "
(energy, market) | \n", - "4 | \n", - "
(next, generation) | \n", - "4 | \n", - "
(search, download) | \n", - "4 | \n", - "
(finite, element) | \n", - "4 | \n", - "
(sentinel, sentinel) | \n", - "4 | \n", - "
(wave, energy) | \n", - "4 | \n", - "
(software, libraries) | \n", - "4 | \n", - "
(impact, assessment) | \n", - "4 | \n", - "
(airborne, lidar) | \n", - "4 | \n", - "
(ecological, niche) | \n", - "4 | \n", - "
(niche, models) | \n", - "4 | \n", - "
(spatial, temporal) | \n", - "4 | \n", - "
(environment, climate) | \n", - "4 | \n", - "
(change, canada) | \n", - "4 | \n", - "
(solar, radiation) | \n", - "4 | \n", - "
(climate, scenarios) | \n", - "4 | \n", - "
(interface, download) | \n", - "4 | \n", - "
(domain, specific) | \n", - "4 | \n", - "
(change, analysis) | \n", - "4 | \n", - "
(optimization, modeling) | \n", - "4 | \n", - "
(forest, management) | \n", - "4 | \n", - "
(global, change) | \n", - "4 | \n", - "
(future, energy) | \n", - "4 | \n", - "
(weather, forecasts) | \n", - "4 | \n", - "
(general, circulation) | \n", - "4 | \n", - "
(large, eddy) | \n", - "4 | \n", - "
(interface, world) | \n", - "4 | \n", - "
(linear, programming) | \n", - "4 | \n", - "
(nasa, earth) | \n", - "4 | \n", - "
(energy, modeling) | \n", - "4 | \n", - "
(home, assistant) | \n", - "4 | \n", - "
(learning, based) | \n", - "4 | \n", - "
(global, biodiversity) | \n", - "4 | \n", - "
(analysis, tools) | \n", - "4 | \n", - "
(software, toolkit) | \n", - "4 | \n", - "
(solar, thermal) | \n", - "4 | \n", - "
(software, tool) | \n", - "4 | \n", - "
(wind, speed) | \n", - "4 | \n", - "
(storage, systems) | \n", - "4 | \n", - "
(building, stock) | \n", - "4 | \n", - "
(different, types) | \n", - "4 | \n", - "
(publicly, available) | \n", - "4 | \n", - "
(particulate, matter) | \n", - "4 | \n", - "
(earth, environmental) | \n", - "3 | \n", - "
(energy, sources) | \n", - "3 | \n", - "
(policy, simulator) | \n", - "3 | \n", - "
(electricity, demand) | \n", - "3 | \n", - "
(energy, related) | \n", - "3 | \n", - "
(global, soil) | \n", - "3 | \n", - "
(tool, evaluating) | \n", - "3 | \n", - "
(electrical, grid) | \n", - "3 | \n", - "
(extended, input) | \n", - "3 | \n", - "
(environmentally, extended) | \n", - "3 | \n", - "
(design, optimization) | \n", - "3 | \n", - "
(atmospheric, composition) | \n", - "3 | \n", - "
(ocean, state) | \n", - "3 | \n", - "
(commonly, used) | \n", - "3 | \n", - "
(digital, services) | \n", - "3 | \n", - "
(framework, modeling) | \n", - "3 | \n", - "
(performance, simulation) | \n", - "3 | \n", - "
(heat, pump) | \n", - "3 | \n", - "
(national, water) | \n", - "3 | \n", - "
(system, simulation) | \n", - "3 | \n", - "
(software, platform) | \n", - "3 | \n", - "
(learning, techniques) | \n", - "3 | \n", - "
(models, used) | \n", - "3 | \n", - "
(climate, sciences) | \n", - "3 | \n", - "
(system, simulator) | \n", - "3 | \n", - "
(environmental, protection) | \n", - "3 | \n", - "
(land, change) | \n", - "3 | \n", - "
(carbon, nitrogen) | \n", - "3 | \n", - "
(oceanic, climate) | \n", - "3 | \n", - "
(visualize, results) | \n", - "3 | \n", - "
(learning, environment) | \n", - "3 | \n", - "
(provides, framework) | \n", - "3 | \n", - "
(models, building) | \n", - "3 | \n", - "
(aims, providing) | \n", - "3 | \n", - "
(soil, properties) | \n", - "3 | \n", - "
(demand, response) | \n", - "3 | \n", - "
(platform, developed) | \n", - "3 | \n", - "
(sentinel, satellite) | \n", - "3 | \n", - "
(carbon, aware) | \n", - "3 | \n", - "
(provides, interface) | \n", - "3 | \n", - "
(plastic, pollution) | \n", - "3 | \n", - "
(dimensional, water) | \n", - "3 | \n", - "
(multi, energy) | \n", - "3 | \n", - "
(high, quality) | \n", - "3 | \n", - "
(common, platform) | \n", - "3 | \n", - "
(provides, functionality) | \n", - "3 | \n", - "
(provides, methods) | \n", - "3 | \n", - "
(system, grid) | \n", - "3 | \n", - "
(designed, facilitate) | \n", - "3 | \n", - "
(smart, meter) | \n", - "3 | \n", - "
(distribution, networks) | \n", - "3 | \n", - "
(forecasting, system) | \n", - "3 | \n", - "
(tree, crown) | \n", - "3 | \n", - "
(energy, performance) | \n", - "3 | \n", - "
(present, future) | \n", - "3 | \n", - "
(future, climate) | \n", - "3 | \n", - "
(speed, direction) | \n", - "3 | \n", - "
(temporal, resolution) | \n", - "3 | \n", - "
(transmission, system) | \n", - "3 | \n", - "
(photovoltaic, energy) | \n", - "3 | \n", - "
(lagrangian, particle) | \n", - "3 | \n", - "
(social, environmental) | \n", - "3 | \n", - "
(ocean, climate) | \n", - "3 | \n", - "
(smart, energy) | \n", - "3 | \n", - "
(image, analysis) | \n", - "3 | \n", - "
(energy, meter) | \n", - "3 | \n", - "
(energy, resource) | \n", - "3 | \n", - "
(library, building) | \n", - "3 | \n", - "
\n", - " | description | \n", - "
---|---|
0 | \n", - "acoustic area backscattering strength in sea w... | \n", - "
1 | \n", - "acoustic signal roundtrip travel time in sea w... | \n", - "
2 | \n", - "acoustic target strength in sea water | \n", - "
3 | \n", - "acoustic volume backscattering strength in sea... | \n", - "
4 | \n", - "aerodynamic particle diameter | \n", - "
... | \n", - "... | \n", - "
4663 | \n", - "y heat flux in sea water due to advection | \n", - "
4664 | \n", - "y wind | \n", - "
4665 | \n", - "y wind gust | \n", - "
4666 | \n", - "zenith angle | \n", - "
4667 | \n", - "\n", - " |
4668 rows × 1 columns
\n", - "\n", - " | count | \n", - "
---|---|
(radioactivity, concentration) | \n", - "726 | \n", - "
(mass, content) | \n", - "663 | \n", - "
(atmosphere, mass) | \n", - "614 | \n", - "
(tendency, atmosphere) | \n", - "583 | \n", - "
(content, surface) | \n", - "367 | \n", - "
(integral, radioactivity) | \n", - "363 | \n", - "
(radioactivity, content) | \n", - "363 | \n", - "
(concentration, integral) | \n", - "363 | \n", - "
(surface, radioactivity) | \n", - "363 | \n", - "
(concentration, radioactivity) | \n", - "362 | \n", - "
(aerosol, particles) | \n", - "269 | \n", - "
(mass, fraction) | \n", - "222 | \n", - "
(mole, concentration) | \n", - "203 | \n", - "
(mass, concentration) | \n", - "196 | \n", - "
(atmosphere, moles) | \n", - "187 | \n", - "
(expressed, carbon) | \n", - "136 | \n", - "
(mole, fraction) | \n", - "133 | \n", - "
(deposition, tendency) | \n", - "108 | \n", - "
(mass, flux) | \n", - "89 | \n", - "
(emission, tendency) | \n", - "81 | \n", - "
(expressed, nitrogen) | \n", - "78 | \n", - "
(water, mole) | \n", - "78 | \n", - "
(particles, mass) | \n", - "73 | \n", - "
(ambient, aerosol) | \n", - "71 | \n", - "
(particulate, organic) | \n", - "66 | \n", - "
(organic, matter) | \n", - "66 | \n", - "
(tendency, mass) | \n", - "65 | \n", - "
(water, mass) | \n", - "65 | \n", - "
(liquid, water) | \n", - "63 | \n", - "
(stratiform, cloud) | \n", - "63 | \n", - "
(surface, downward) | \n", - "62 | \n", - "
(flux, water) | \n", - "61 | \n", - "
(fires, tendency) | \n", - "60 | \n", - "
(carbon, dioxide) | \n", - "59 | \n", - "
(mole, content) | \n", - "55 | \n", - "
(surface, upward) | \n", - "54 | \n", - "
(carbon, water) | \n", - "53 | \n", - "
(water, velocity) | \n", - "52 | \n", - "
(particles, deposition) | \n", - "51 | \n", - "
(fraction, stratiform) | \n", - "49 | \n", - "
(heat, flux) | \n", - "48 | \n", - "
(production, tendency) | \n", - "48 | \n", - "
(combustion, tendency) | \n", - "48 | \n", - "
(cloud, liquid) | \n", - "47 | \n", - "
(shortwave, flux) | \n", - "46 | \n", - "
(water, surface) | \n", - "44 | \n", - "
(emission, agricultural) | \n", - "44 | \n", - "
(flux, carbon) | \n", - "43 | \n", - "
(matter, aerosol) | \n", - "43 | \n", - "
(tendency, ocean) | \n", - "43 | \n", - "
(transport, tendency) | \n", - "41 | \n", - "
(content, nitrogen) | \n", - "41 | \n", - "
(upward, mass) | \n", - "39 | \n", - "
(surface, wave) | \n", - "39 | \n", - "
(water, vapor) | \n", - "39 | \n", - "
(flux, surface) | \n", - "38 | \n", - "
(ocean, mole) | \n", - "38 | \n", - "
(content, carbon) | \n", - "38 | \n", - "
(carbon, aerosol) | \n", - "38 | \n", - "
(advection, tendency) | \n", - "37 | \n", - "
(monoxide, emission) | \n", - "36 | \n", - "
(assuming, clear) | \n", - "35 | \n", - "
(tendency, water) | \n", - "35 | \n", - "
(dioxide, expressed) | \n", - "33 | \n", - "
(particles, atmosphere) | \n", - "33 | \n", - "
(surface, downwelling) | \n", - "32 | \n", - "
(surface, snow) | \n", - "32 | \n", - "
(swell, wave) | \n", - "32 | \n", - "
(spectral, density) | \n", - "32 | \n", - "
(variance, spectral) | \n", - "32 | \n", - "
(content, water) | \n", - "32 | \n", - "
(radiative, flux) | \n", - "32 | \n", - "
(matter, expressed) | \n", - "32 | \n", - "
(nitrogen, monoxide) | \n", - "31 | \n", - "
(eddy, advection) | \n", - "31 | \n", - "
(content, atmosphere) | \n", - "31 | \n", - "
(savanna, grassland) | \n", - "30 | \n", - "
(emission, forest) | \n", - "30 | \n", - "
(grassland, fires) | \n", - "30 | \n", - "
(emission, savanna) | \n", - "30 | \n", - "
(fraction, mole) | \n", - "30 | \n", - "
(forest, fires) | \n", - "30 | \n", - "
(longwave, flux) | \n", - "29 | \n", - "
(convective, cloud) | \n", - "29 | \n", - "
(water, temperature) | \n", - "29 | \n", - "
(mass, water) | \n", - "29 | \n", - "
(concentration, dissolved) | \n", - "28 | \n", - "
(compounds, expressed) | \n", - "28 | \n", - "
(nitrogen, compounds) | \n", - "28 | \n", - "
(energy, content) | \n", - "28 | \n", - "
(particles, expressed) | \n", - "27 | \n", - "
(salt, aerosol) | \n", - "27 | \n", - "
(water, moles) | \n", - "27 | \n", - "
(flux, assuming) | \n", - "27 | \n", - "
(concentration, particulate) | \n", - "27 | \n", - "
(optical, thickness) | \n", - "26 | \n", - "
(surface, height) | \n", - "26 | \n", - "
(elemental, carbon) | \n", - "26 | \n", - "
(content, particulate) | \n", - "26 | \n", - "
(minus, tendency) | \n", - "26 | \n", - "
(wave, period) | \n", - "25 | \n", - "
(tendency, mole) | \n", - "25 | \n", - "
(eastward, wind) | \n", - "25 | \n", - "
(waste, treatment) | \n", - "25 | \n", - "
(disposal, tendency) | \n", - "25 | \n", - "
(treatment, disposal) | \n", - "25 | \n", - "
(carbon, monoxide) | \n", - "25 | \n", - "
(dissolved, inorganic) | \n", - "25 | \n", - "
(emission, waste) | \n", - "25 | \n", - "
(land, transport) | \n", - "24 | \n", - "
(residential, combustion) | \n", - "24 | \n", - "
(emission, land) | \n", - "24 | \n", - "
(emission, residential) | \n", - "24 | \n", - "
(particles, emission) | \n", - "24 | \n", - "
(production, distribution) | \n", - "23 | \n", - "
(agricultural, waste) | \n", - "23 | \n", - "
(emission, industrial) | \n", - "23 | \n", - "
(distribution, tendency) | \n", - "23 | \n", - "
(dust, aerosol) | \n", - "23 | \n", - "
(carbon, emission) | \n", - "23 | \n", - "
(emission, energy) | \n", - "23 | \n", - "
(industrial, combustion) | \n", - "23 | \n", - "
(burning, tendency) | \n", - "23 | \n", - "
(waste, burning) | \n", - "23 | \n", - "
(nmvoc, expressed) | \n", - "23 | \n", - "
(energy, production) | \n", - "23 | \n", - "
(northward, wind) | \n", - "22 | \n", - "
(tendency, temperature) | \n", - "22 | \n", - "
(sulfur, dioxide) | \n", - "22 | \n", - "
(condensed, water) | \n", - "22 | \n", - "
(deposition, minus) | \n", - "22 | \n", - "
(nitrogen, water) | \n", - "22 | \n", - "
(nitrogen, deposition) | \n", - "21 | \n", - "
(agricultural, production) | \n", - "21 | \n", - "
(content, elemental) | \n", - "21 | \n", - "
(maximum, surface) | \n", - "19 | \n", - "
(water, downwelling) | \n", - "19 | \n", - "
(carbon, mass) | \n", - "19 | \n", - "
(biomass, expressed) | \n", - "19 | \n", - "
(chlorophyll, water) | \n", - "19 | \n", - "
(number, concentration) | \n", - "19 | \n", - "
(content, expressed) | \n", - "19 | \n", - "
(density, maximum) | \n", - "19 | \n", - "
(expressed, heat) | \n", - "19 | \n", - "
(water, salinity) | \n", - "19 | \n", - "
(water, flux) | \n", - "19 | \n", - "
(surface, swell) | \n", - "18 | \n", - "
(northward, ocean) | \n", - "18 | \n", - "
(sulfate, aerosol) | \n", - "18 | \n", - "
(surface, upwelling) | \n", - "18 | \n", - "
(parameterized, mesoscale) | \n", - "18 | \n", - "
(maritime, transport) | \n", - "17 | \n", - "
(moles, tendency) | \n", - "17 | \n", - "
(water, soil) | \n", - "17 | \n", - "
(downwelling, shortwave) | \n", - "17 | \n", - "
(wavelength, water) | \n", - "17 | \n", - "
(emission, maritime) | \n", - "17 | \n", - "
(nitrogen, dioxide) | \n", - "16 | \n", - "
(productivity, biomass) | \n", - "16 | \n", - "
(content, parameterized) | \n", - "16 | \n", - "
(nitric, acid) | \n", - "16 | \n", - "
(soil, mass) | \n", - "16 | \n", - "
(downwelling, photosynthetic) | \n", - "16 | \n", - "
(content, salt) | \n", - "16 | \n", - "
(land, surface) | \n", - "16 | \n", - "
(content, dust) | \n", - "16 | \n", - "
(heat, content) | \n", - "16 | \n", - "
(content, sulfur) | \n", - "16 | \n", - "
(northward, water) | \n", - "16 | \n", - "
(cloud, condensed) | \n", - "16 | \n", - "
(eastward, water) | \n", - "16 | \n", - "
(temperature, expressed) | \n", - "16 | \n", - "
(atmosphere, mole) | \n", - "16 | \n", - "
(atmosphere, optical) | \n", - "16 | \n", - "
(methane, emission) | \n", - "16 | \n", - "
(content, sulfate) | \n", - "15 | \n", - "
(convection, tendency) | \n", - "15 | \n", - "
(mixing, tendency) | \n", - "15 | \n", - "
(dioxide, emission) | \n", - "15 | \n", - "
(content, organic) | \n", - "15 | \n", - "
(nitrogen, mass) | \n", - "15 | \n", - "
(acid, mass) | \n", - "15 | \n", - "
(period, variance) | \n", - "15 | \n", - "
(ocean, heat) | \n", - "15 | \n", - "
(growth, limitation) | \n", - "15 | \n", - "
(particulate, matter) | \n", - "15 | \n", - "
(parameterized, eddy) | \n", - "15 | \n", - "
(heat, transport) | \n", - "15 | \n", - "
(effective, radius) | \n", - "14 | \n", - "
(concentration, mole) | \n", - "14 | \n", - "
(concentration, mass) | \n", - "14 | \n", - "
(acid, mole) | \n", - "14 | \n", - "
(cloud, fraction) | \n", - "14 | \n", - "
(content, emission) | \n", - "14 | \n", - "
(moles, atmosphere) | \n", - "14 | \n", - "
(downward, mass) | \n", - "14 | \n", - "
(content, ammonia) | \n", - "14 | \n", - "
(dimethyl, sulfide) | \n", - "14 | \n", - "
(content, formaldehyde) | \n", - "14 | \n", - "
(fraction, mass) | \n", - "14 | \n", - "
(advection, ocean) | \n", - "14 | \n", - "
(temperature, water) | \n", - "14 | \n", - "
(content, nmvoc) | \n", - "14 | \n", - "
(mole, flux) | \n", - "14 | \n", - "
(acid, atmosphere) | \n", - "14 | \n", - "
(inorganic, carbon) | \n", - "14 | \n", - "
(spherical, irradiance) | \n", - "14 | \n", - "
(content, methane) | \n", - "14 | \n", - "
(content, xylene) | \n", - "13 | \n", - "
(amount, thickness) | \n", - "13 | \n", - "
(fraction, cloud) | \n", - "13 | \n", - "
(content, toluene) | \n", - "13 | \n", - "
(ocean, tracer) | \n", - "13 | \n", - "
(mesoscale, eddy) | \n", - "13 | \n", - "
(velocity, surface) | \n", - "13 | \n", - "
(radiance, wavelength) | \n", - "13 | \n", - "
(molecular, hydrogen) | \n", - "13 | \n", - "
(phytoplankton, expressed) | \n", - "13 | \n", - "
(kinetic, energy) | \n", - "13 | \n", - "
(content, ethane) | \n", - "12 | \n", - "
(xylene, emission) | \n", - "12 | \n", - "
(content, butane) | \n", - "12 | \n", - "
(wind, wave) | \n", - "12 | \n", - "
(vapor, atmosphere) | \n", - "12 | \n", - "
(nitrous, oxide) | \n", - "12 | \n", - "
(downward, stress) | \n", - "12 | \n", - "
(content, propane) | \n", - "12 | \n", - "
(content, propene) | \n", - "12 | \n", - "
(salinity, water) | \n", - "12 | \n", - "
(toluene, emission) | \n", - "12 | \n", - "
(content, ethyne) | \n", - "12 | \n", - "
(content, ethene) | \n", - "12 | \n", - "
(partial, pressure) | \n", - "12 | \n", - "
(surface, wind) | \n", - "12 | \n", - "
(conservative, temperature) | \n", - "12 | \n", - "
(downwelling, photon) | \n", - "12 | \n", - "
(content, dissolved) | \n", - "12 | \n", - "
(nmvoc, emission) | \n", - "12 | \n", - "
(water, particles) | \n", - "12 | \n", - "
(water, sinking) | \n", - "12 | \n", - "
(precipitation, flux) | \n", - "12 | \n", - "
(moles, methyl) | \n", - "12 | \n", - "
(diffusivity, ocean) | \n", - "12 | \n", - "
(downward, shortwave) | \n", - "12 | \n", - "
(ocean, mass) | \n", - "11 | \n", - "
(content, aerosol) | \n", - "11 | \n", - "
(propane, emission) | \n", - "11 | \n", - "
(propene, emission) | \n", - "11 | \n", - "
(litter, soil) | \n", - "11 | \n", - "
(flux, particulate) | \n", - "11 | \n", - "
(stress, surface) | \n", - "11 | \n", - "
(ethyne, emission) | \n", - "11 | \n", - "
(agricultural, products) | \n", - "11 | \n", - "
(forestry, agricultural) | \n", - "11 | \n", - "
(height, surface) | \n", - "11 | \n", - "
(biological, tendency) | \n", - "11 | \n", - "
(concentration, carbon) | \n", - "11 | \n", - "
(ethene, emission) | \n", - "11 | \n", - "
(radiance, water) | \n", - "11 | \n", - "
(butane, emission) | \n", - "11 | \n", - "
(ethane, emission) | \n", - "11 | \n", - "
(water, amount) | \n", - "11 | \n", - "
(moment, surface) | \n", - "11 | \n", - "
(alpha, hexachlorocyclohexane) | \n", - "11 | \n", - "
(dioxide, atmosphere) | \n", - "11 | \n", - "
(water, cloud) | \n", - "11 | \n", - "
(content, benzene) | \n", - "11 | \n", - "
(downward, heat) | \n", - "11 | \n", - "
(tendency, eastward) | \n", - "11 | \n", - "
(biological, production) | \n", - "11 | \n", - "
(gaseous, divalent) | \n", - "10 | \n", - "
(gaseous, elemental) | \n", - "10 | \n", - "
(elemental, mercury) | \n", - "10 | \n", - "
(formaldehyde, emission) | \n", - "10 | \n", - "
(methyl, bromide) | \n", - "10 | \n", - "
(salt, flux) | \n", - "10 | \n", - "
(methyl, chloride) | \n", - "10 | \n", - "
(upwelling, radiance) | \n", - "10 | \n", - "
(water, density) | \n", - "10 | \n", - "
(divalent, mercury) | \n", - "10 | \n", - "
(backwards, scattering) | \n", - "10 | \n", - "
(benzene, emission) | \n", - "10 | \n", - "
(biological, taxon) | \n", - "10 | \n", - "
(snow, amount) | \n", - "10 | \n", - "
(iron, water) | \n", - "10 | \n", - "
(flux, upward) | \n", - "10 | \n", - "
(hydrogen, peroxide) | \n", - "10 | \n", - "
(upward, velocity) | \n", - "10 | \n", - "
(nitrous, acid) | \n", - "10 | \n", - "
(tropical, cyclone) | \n", - "10 | \n", - "
(velocity, land) | \n", - "10 | \n", - "
(diffusion, tendency) | \n", - "10 | \n", - "
(dissolved, organic) | \n", - "10 | \n", - "
(downward, longwave) | \n", - "10 | \n", - "
(wave, surface) | \n", - "10 | \n", - "
(particles, number) | \n", - "10 | \n", - "
(flux, wavelength) | \n", - "10 | \n", - "
(period, surface) | \n", - "10 | \n", - "
(northward, stress) | \n", - "10 | \n", - "
(water, evaporation) | \n", - "10 | \n", - "