data-science-ipython-notebooks/commands/linux.ipynb

428 lines
9.3 KiB
Plaintext
Raw Normal View History

{
"metadata": {
"name": "",
"signature": "sha256:4515e5f88373961da62945f02e97b93ca0c73478b952696d14d5cd396af307f1"
},
"nbformat": 3,
"nbformat_minor": 0,
"worksheets": [
{
"cells": [
{
"cell_type": "markdown",
"metadata": {},
"source": [
"# Linux Commands\n",
"\n",
"* Disk Usage\n",
"* Splitting Files\n",
"* Grep\n",
"* Compression\n",
2015-03-02 05:27:48 +08:00
"* Curl\n",
"* View Running Processes\n",
2015-03-01 21:16:23 +08:00
"* Terminal Syntax Highlighting\n",
"* Vim"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Disk Usage"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Display human-readable (-h) free disk space:"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"df -h"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Display human-readable (-h) disk usage statistics:"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"du -h ./"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Display human-readable (-h) disk usage statistics, showing only the total usage (-s):"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"du -sh ../"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Display the human-readable (-h) disk usage statistics, showing also the grand total for all file types (-c):"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"du -csh ./"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Splitting Files"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Count number of lines in a file with wc:"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"wc -l < file.txt"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Count the number of lines in a file with grep:"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"grep -c \".\" file.txt"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Split a file into multiple files based on line count:"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"split -l 20 file.txt new"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Split a file into multiple files based on line count, use suffix of length 1:"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"split -l 802 -a 1 file.csv dir/part-user-csv.tbl-"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Grep"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Check number of files matching \u201c.txt\":"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"ls -1 | grep .txt | wc -l"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Check number of MapReduce records processed, outputting the results to the terminal:"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"cat * | grep -c \"foo\" folder/part*"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Compression"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"# Compress zip\n",
"zip -r archive_name.zip folder_to_compress\n",
"\n",
"# Compress zip without invisible Mac resources\n",
"zip -r -X archive_name.zip folder_to_compress\n",
"\n",
"# Extract zip\n",
"unzip archive_name.zip\n",
"\n",
"# Compress TAR.GZ\n",
"tar -zcvf archive_name.tar.gz folder_to_compress\n",
"\n",
"# Extract TAR.GZ\n",
"tar -zxvf archive_name.tar.gz\n",
"\n",
"# Compress TAR.BZ2\n",
"tar -jcvf archive_name.tar.bz2 folder_to_compress\n",
"\n",
"# Extract TAR.BZ2\n",
"tar -jxvf archive_name.tar.bz2\n",
"\n",
"# Extract GZ\n",
"gunzip archivename.gz\n",
"\n",
"# Uncompress all tar.gz in current directory to another directory\n",
"for i in *.tar.gz; do echo working on $i; tar xvzf $i -C directory/ ; done"
],
"language": "python",
"metadata": {},
"outputs": []
},
2015-03-02 05:27:48 +08:00
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Curl"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"# Display the curl output:\n",
"curl donnemartin.com\n",
"\n",
"# Download the curl output to a file:\n",
"curl donnemartin.com > donnemartin.html\n",
"\n",
"# Download the curl output to a file -o\n",
"curl -o image.png http://i1.wp.com/donnemartin.com/wp-content/uploads/2015/02/splunk_cover.png\n",
"\n",
"# Download the curl output to a file, keeping the original file name -O\n",
"curl -O http://i1.wp.com/donnemartin.com/wp-content/uploads/2015/02/splunk_cover.png\n",
" \n",
"# Download multiple files, attempting to reuse the same connection\n",
"curl -O url1 -O url2\n",
"\n",
"# Follow redirects -L\n",
"curl -L url\n",
"\n",
"# Resume a previous download -C -\n",
"curl -C - -O url\n",
"\n",
"# Authenticate -u\n",
"curl -u username:password url"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## View Running Processes"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"# Display sorted info about processes\n",
"top\n",
"\n",
"# Display all running processes\n",
"ps aux | less\n",
"\n",
"# See processes run by user dmartin\n",
"ps -u dmartin\n",
"\n",
"# Display running processes as a tree\n",
"pstree"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Terminal Syntax Highlighting"
]
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Add the following to your ~/.bash_profile:"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"export PS1='\\[\\033[01;32m\\]\\u@\\h\\[\\033[00m\\]:\\[\\033[01;34m\\]\\W\\[\\033[00m\\]\\$ '\n",
"export CLICOLOR=1\n",
"export LSCOLORS=ExFxBxDxCxegedabagacad\n",
"alias ls='ls -GFh'"
],
"language": "python",
"metadata": {},
"outputs": []
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"Reload .bash_profile:"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
"source ~/.bash_profile"
],
"language": "python",
"metadata": {},
"outputs": []
2015-03-01 21:16:23 +08:00
},
{
"cell_type": "markdown",
"metadata": {},
"source": [
"## Vim"
]
},
{
"cell_type": "code",
"collapsed": false,
"input": [
2015-03-01 21:16:23 +08:00
"Normal mode: esc\n",
"\n",
"Basic movement: h, j, k, l\n",
"Word movement: w, W, e, E, b, B\n",
"\n",
"Go to matching parenthesis: %\n",
"Go to start of the line: 0\n",
"Go to end of the line: $\n",
"\n",
"Find character: f\n",
"\n",
"Insert mode: i\n",
"Append to line: A\n",
"\n",
"Delete character: x\n",
"Delete command: d\n",
"Delete line: dd\n",
"\n",
"Replace command: r\n",
"Change command: c\n",
"\n",
"Undo: u (U for all changes on a line)\n",
"Redo: CTRL-R\n",
"\n",
"Copy the current line: yy\n",
"Paste the current line: p (P for paste above cursor)\n",
"\n",
"Quit without saving changes: q!\n",
"Write the current file and quit: :wq\n",
"\n",
"# Run the following command to enable the tutorial\n",
"vimtutor\n",
"\n",
"# Run the following commands to enable syntax colors\n",
"cd ~\n",
"vim .vimrc\n",
"syntax on\n",
":wq"
],
"language": "python",
"metadata": {},
"outputs": []
}
],
"metadata": {}
}
]
}