Skip to content

Instantly share code, notes, and snippets.

@jiffyclub
Created June 8, 2016 22:01
Show Gist options
  • Select an option

  • Save jiffyclub/6c548b2ecec33b36076cee87f85f2917 to your computer and use it in GitHub Desktop.

Select an option

Save jiffyclub/6c548b2ecec33b36076cee87f85f2917 to your computer and use it in GitHub Desktop.

Revisions

  1. jiffyclub created this gist Jun 8, 2016.
    397 changes: 397 additions & 0 deletions dataframe_concatenation.ipynb
    Original file line number Diff line number Diff line change
    @@ -0,0 +1,397 @@
    {
    "cells": [
    {
    "cell_type": "code",
    "execution_count": 1,
    "metadata": {
    "collapsed": true
    },
    "outputs": [],
    "source": [
    "import pandas as pd"
    ]
    },
    {
    "cell_type": "code",
    "execution_count": 2,
    "metadata": {
    "collapsed": false
    },
    "outputs": [
    {
    "data": {
    "text/html": [
    "<div>\n",
    "<table border=\"1\" class=\"dataframe\">\n",
    " <thead>\n",
    " <tr style=\"text-align: right;\">\n",
    " <th></th>\n",
    " <th>0</th>\n",
    " <th>1</th>\n",
    " <th>2</th>\n",
    " <th>3</th>\n",
    " <th>4</th>\n",
    " <th>5</th>\n",
    " <th>6</th>\n",
    " <th>7</th>\n",
    " <th>8</th>\n",
    " <th>9</th>\n",
    " <th>10</th>\n",
    " <th>11</th>\n",
    " <th>Account</th>\n",
    " <th>Source</th>\n",
    " </tr>\n",
    " </thead>\n",
    " <tbody>\n",
    " <tr>\n",
    " <th>0</th>\n",
    " <td>0</td>\n",
    " <td>1</td>\n",
    " <td>2</td>\n",
    " <td>3</td>\n",
    " <td>4</td>\n",
    " <td>5</td>\n",
    " <td>6</td>\n",
    " <td>7</td>\n",
    " <td>8</td>\n",
    " <td>9</td>\n",
    " <td>10</td>\n",
    " <td>11</td>\n",
    " <td>asdf</td>\n",
    " <td>qwer</td>\n",
    " </tr>\n",
    " <tr>\n",
    " <th>1</th>\n",
    " <td>12</td>\n",
    " <td>13</td>\n",
    " <td>14</td>\n",
    " <td>15</td>\n",
    " <td>16</td>\n",
    " <td>17</td>\n",
    " <td>18</td>\n",
    " <td>19</td>\n",
    " <td>20</td>\n",
    " <td>21</td>\n",
    " <td>22</td>\n",
    " <td>23</td>\n",
    " <td>yuiop</td>\n",
    " <td>hjkl</td>\n",
    " </tr>\n",
    " </tbody>\n",
    "</table>\n",
    "</div>"
    ],
    "text/plain": [
    " 0 1 2 3 4 5 6 7 8 9 10 11 Account Source\n",
    "0 0 1 2 3 4 5 6 7 8 9 10 11 asdf qwer\n",
    "1 12 13 14 15 16 17 18 19 20 21 22 23 yuiop hjkl"
    ]
    },
    "execution_count": 2,
    "metadata": {},
    "output_type": "execute_result"
    }
    ],
    "source": [
    "# Build a two-row demo frame: twelve integer columns labelled '0'..'11'\n",
    "# followed by the string columns 'Account' and 'Source'.\n",
    "column_labels = [str(i) for i in range(12)] + ['Account', 'Source']\n",
    "rows = [\n",
    "    list(range(12)) + ['asdf', 'qwer'],\n",
    "    list(range(12, 24)) + ['yuiop', 'hjkl'],\n",
    "]\n",
    "df = pd.DataFrame(rows, columns=column_labels)\n",
    "df"
    ]
    },
    {
    "cell_type": "code",
    "execution_count": 3,
    "metadata": {
    "collapsed": true
    },
    "outputs": [],
    "source": [
    "# Split the wide frame into two six-column halves; both halves keep the\n",
    "# shared 'Account' and 'Source' columns.\n",
    "shared_cols = ['Account', 'Source']\n",
    "df_first = df[[str(i) for i in range(6)] + shared_cols]\n",
    "df_second = df[[str(i) for i in range(6, 12)] + shared_cols]"
    ]
    },
    {
    "cell_type": "code",
    "execution_count": 4,
    "metadata": {
    "collapsed": false
    },
    "outputs": [
    {
    "data": {
    "text/html": [
    "<div>\n",
    "<table border=\"1\" class=\"dataframe\">\n",
    " <thead>\n",
    " <tr style=\"text-align: right;\">\n",
    " <th></th>\n",
    " <th>0</th>\n",
    " <th>1</th>\n",
    " <th>2</th>\n",
    " <th>3</th>\n",
    " <th>4</th>\n",
    " <th>5</th>\n",
    " <th>Account</th>\n",
    " <th>Source</th>\n",
    " </tr>\n",
    " </thead>\n",
    " <tbody>\n",
    " <tr>\n",
    " <th>0</th>\n",
    " <td>6</td>\n",
    " <td>7</td>\n",
    " <td>8</td>\n",
    " <td>9</td>\n",
    " <td>10</td>\n",
    " <td>11</td>\n",
    " <td>asdf</td>\n",
    " <td>qwer</td>\n",
    " </tr>\n",
    " <tr>\n",
    " <th>1</th>\n",
    " <td>18</td>\n",
    " <td>19</td>\n",
    " <td>20</td>\n",
    " <td>21</td>\n",
    " <td>22</td>\n",
    " <td>23</td>\n",
    " <td>yuiop</td>\n",
    " <td>hjkl</td>\n",
    " </tr>\n",
    " </tbody>\n",
    "</table>\n",
    "</div>"
    ],
    "text/plain": [
    " 0 1 2 3 4 5 Account Source\n",
    "0 6 7 8 9 10 11 asdf qwer\n",
    "1 18 19 20 21 22 23 yuiop hjkl"
    ]
    },
    "execution_count": 4,
    "metadata": {},
    "output_type": "execute_result"
    }
    ],
    "source": [
    "# Relabel columns '6'..'11' as '0'..'5' so they match df_first's labels.\n",
    "relabel = {str(old): str(old - 6) for old in range(6, 12)}\n",
    "df_second = df_second.rename(columns=relabel)\n",
    "df_second"
    ]
    },
    {
    "cell_type": "code",
    "execution_count": 5,
    "metadata": {
    "collapsed": false
    },
    "outputs": [
    {
    "data": {
    "text/html": [
    "<div>\n",
    "<table border=\"1\" class=\"dataframe\">\n",
    " <thead>\n",
    " <tr style=\"text-align: right;\">\n",
    " <th></th>\n",
    " <th>0</th>\n",
    " <th>1</th>\n",
    " <th>2</th>\n",
    " <th>3</th>\n",
    " <th>4</th>\n",
    " <th>5</th>\n",
    " <th>Account</th>\n",
    " <th>Source</th>\n",
    " </tr>\n",
    " </thead>\n",
    " <tbody>\n",
    " <tr>\n",
    " <th>0</th>\n",
    " <td>0</td>\n",
    " <td>1</td>\n",
    " <td>2</td>\n",
    " <td>3</td>\n",
    " <td>4</td>\n",
    " <td>5</td>\n",
    " <td>asdf</td>\n",
    " <td>qwer</td>\n",
    " </tr>\n",
    " <tr>\n",
    " <th>1</th>\n",
    " <td>12</td>\n",
    " <td>13</td>\n",
    " <td>14</td>\n",
    " <td>15</td>\n",
    " <td>16</td>\n",
    " <td>17</td>\n",
    " <td>yuiop</td>\n",
    " <td>hjkl</td>\n",
    " </tr>\n",
    " <tr>\n",
    " <th>2</th>\n",
    " <td>6</td>\n",
    " <td>7</td>\n",
    " <td>8</td>\n",
    " <td>9</td>\n",
    " <td>10</td>\n",
    " <td>11</td>\n",
    " <td>asdf</td>\n",
    " <td>qwer</td>\n",
    " </tr>\n",
    " <tr>\n",
    " <th>3</th>\n",
    " <td>18</td>\n",
    " <td>19</td>\n",
    " <td>20</td>\n",
    " <td>21</td>\n",
    " <td>22</td>\n",
    " <td>23</td>\n",
    " <td>yuiop</td>\n",
    " <td>hjkl</td>\n",
    " </tr>\n",
    " </tbody>\n",
    "</table>\n",
    "</div>"
    ],
    "text/plain": [
    " 0 1 2 3 4 5 Account Source\n",
    "0 0 1 2 3 4 5 asdf qwer\n",
    "1 12 13 14 15 16 17 yuiop hjkl\n",
    "2 6 7 8 9 10 11 asdf qwer\n",
    "3 18 19 20 21 22 23 yuiop hjkl"
    ]
    },
    "execution_count": 5,
    "metadata": {},
    "output_type": "execute_result"
    }
    ],
    "source": [
    "# DataFrame.append was deprecated in pandas 1.4 and removed in 2.0, so\n",
    "# stack with pd.concat instead; reset_index(drop=True) renumbers the rows\n",
    "# from 0, matching what append(..., ignore_index=True) used to return.\n",
    "pd.concat([df_first, df_second]).reset_index(drop=True)"
    ]
    },
    {
    "cell_type": "code",
    "execution_count": 7,
    "metadata": {
    "collapsed": false
    },
    "outputs": [
    {
    "data": {
    "text/html": [
    "<div>\n",
    "<table border=\"1\" class=\"dataframe\">\n",
    " <thead>\n",
    " <tr style=\"text-align: right;\">\n",
    " <th></th>\n",
    " <th>0</th>\n",
    " <th>1</th>\n",
    " <th>2</th>\n",
    " <th>3</th>\n",
    " <th>4</th>\n",
    " <th>5</th>\n",
    " <th>Account</th>\n",
    " <th>Source</th>\n",
    " </tr>\n",
    " </thead>\n",
    " <tbody>\n",
    " <tr>\n",
    " <th>0</th>\n",
    " <td>0</td>\n",
    " <td>1</td>\n",
    " <td>2</td>\n",
    " <td>3</td>\n",
    " <td>4</td>\n",
    " <td>5</td>\n",
    " <td>asdf</td>\n",
    " <td>qwer</td>\n",
    " </tr>\n",
    " <tr>\n",
    " <th>1</th>\n",
    " <td>12</td>\n",
    " <td>13</td>\n",
    " <td>14</td>\n",
    " <td>15</td>\n",
    " <td>16</td>\n",
    " <td>17</td>\n",
    " <td>yuiop</td>\n",
    " <td>hjkl</td>\n",
    " </tr>\n",
    " <tr>\n",
    " <th>2</th>\n",
    " <td>6</td>\n",
    " <td>7</td>\n",
    " <td>8</td>\n",
    " <td>9</td>\n",
    " <td>10</td>\n",
    " <td>11</td>\n",
    " <td>asdf</td>\n",
    " <td>qwer</td>\n",
    " </tr>\n",
    " <tr>\n",
    " <th>3</th>\n",
    " <td>18</td>\n",
    " <td>19</td>\n",
    " <td>20</td>\n",
    " <td>21</td>\n",
    " <td>22</td>\n",
    " <td>23</td>\n",
    " <td>yuiop</td>\n",
    " <td>hjkl</td>\n",
    " </tr>\n",
    " </tbody>\n",
    "</table>\n",
    "</div>"
    ],
    "text/plain": [
    " 0 1 2 3 4 5 Account Source\n",
    "0 0 1 2 3 4 5 asdf qwer\n",
    "1 12 13 14 15 16 17 yuiop hjkl\n",
    "2 6 7 8 9 10 11 asdf qwer\n",
    "3 18 19 20 21 22 23 yuiop hjkl"
    ]
    },
    "execution_count": 7,
    "metadata": {},
    "output_type": "execute_result"
    }
    ],
    "source": [
    "# Stack the two column-aligned halves row-wise; ignore_index=True discards\n",
    "# the original row labels and renumbers the result from 0.\n",
    "pd.concat(objs=[df_first, df_second], axis=0, ignore_index=True)"
    ]
    },
    {
    "cell_type": "code",
    "execution_count": null,
    "metadata": {
    "collapsed": true
    },
    "outputs": [],
    "source": []
    }
    ],
    "metadata": {
    "kernelspec": {
    "display_name": "Python 3",
    "language": "python",
    "name": "python3"
    },
    "language_info": {
    "codemirror_mode": {
    "name": "ipython",
    "version": 3
    },
    "file_extension": ".py",
    "mimetype": "text/x-python",
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
    "version": "3.5.1"
    }
    },
    "nbformat": 4,
    "nbformat_minor": 0
    }