1. 程式人生 > >Linux中shell檔案操作大全

Linux中shell檔案操作大全

1.建立資料夾
#!/bin/sh
# Create the directory %%1 (template placeholder) with mode 777, i.e.
# read/write/execute permission for owner, group and others.
mkdir -m 777 "%%1"

2.建立檔案
#!/bin/sh
# Create %%1 as an empty file when it does not exist yet; for an existing
# file touch only refreshes its timestamps.
touch "%%1"

3.刪除檔案
#!/bin/sh
# Delete the file %%1 without prompting and without complaining when it
# does not exist.
# The original passed "-if": -i (prompt) and -f (never prompt) contradict
# each other and the later one wins, so only -f is kept.  "--" stops option
# parsing so a name that starts with "-" is treated as a file.
rm -f -- "%%1"

4.刪除資料夾
#!/bin/sh
# Recursively delete the directory %%1 and everything below it.
# "--" stops option parsing so a name that starts with "-" is not taken
# for an option.
rm -rf -- "%%1"

5.刪除一個目錄下所有的資料夾
#!/bin/bash
# Delete every sub-directory that sits directly inside a directory; regular
# files in that directory are left alone.

#######################################
# Remove all immediate sub-directories of a directory.
# Arguments: $1 - parent directory (must be non-empty)
# Returns:   status of the last rm, 0 when nothing had to be removed
#######################################
remove_subdirs() {
  local parent=$1
  local entry
  # Quoting keeps names with blanks or glob characters in one piece.
  for entry in "${parent:?}"/*; do
    # An unmatched glob stays literal and fails -d, so an empty directory
    # is simply a no-op.
    if [ -d "$entry" ]; then
      rm -rf -- "$entry"
    fi
  done
}

remove_subdirs "%%1" #$(pwd)

6.清空資料夾
#!/bin/bash
# Empty a directory: remove every non-hidden file and sub-directory in it
# while keeping the directory itself.

#######################################
# Remove all non-hidden entries of a directory.
# Arguments: $1 - directory to empty (must be non-empty string)
# Returns:   exit status of rm
#######################################
clear_dir() {
  local dir=$1
  # One quoted "rm -rf" replaces the original "rm -if" plus directory loop,
  # which broke on names containing blanks.  With -f an unmatched glob
  # (empty directory) is silently ignored.  Like the original glob, names
  # starting with "." are not matched.
  rm -rf -- "${dir:?}"/*
}

clear_dir "%%1" #$(pwd)

7.讀取檔案
#!/bin/sh
7.1.作業系統預設編碼
# Print %%1 line by line.
# "IFS=" and "-r" keep leading/trailing blanks and backslashes intact,
# printf avoids echo's option and escape handling, and the "|| [ -n ... ]"
# clause still delivers a last line that has no trailing newline.
# Redirecting into the loop replaces the extra cat process.
while IFS= read -r line || [ -n "$line" ]; do
  printf '%s\n' "$line"
done < "%%1"

7.2.UTF-8編碼
# Print %%1 line by line; the bytes of each line are passed through
# unchanged, so UTF-8 text is preserved as-is.
# "IFS=" and "-r" keep blanks and backslashes intact, printf avoids echo's
# option and escape handling, and "|| [ -n ... ]" still delivers a last
# line that has no trailing newline.
while IFS= read -r line || [ -n "$line" ]; do
  printf '%s\n' "$line"
done < "%%1"

7.3.分塊讀取
# Read %%1 piece by piece, one line per iteration, and print each piece.
# "IFS=" and "-r" keep blanks and backslashes intact, printf avoids echo's
# option and escape handling, and "|| [ -n ... ]" still delivers a last
# line that has no trailing newline.
while IFS= read -r line || [ -n "$line" ]; do
  printf '%s\n' "$line"
done < "%%1"

8.寫入檔案
#!/bin/sh
# Write the text %%2 to the file %%1, replacing any previous content.
# The here-doc delimiter is quoted so the text is written literally:
# "$", backticks and backslashes in it are not expanded by the shell.
cat > "%%1" << 'EOF'
%%2
EOF

# Equivalent alternative using tee (writes the same content again).
tee "%%1" > /dev/null << 'EOF'
%%2
EOF

# Appending a line instead of overwriting (GNU sed); the file to edit is %%1:
#sed -i '$a %%2' %%1

9.寫入隨機檔案
#!/bin/sh
# Write the text %%2 to the file %%1, replacing any previous content.
# The here-doc delimiter is quoted so the text is written literally:
# "$", backticks and backslashes in it are not expanded by the shell.
cat > "%%1" << 'EOF'
%%2
EOF

# Equivalent alternative using tee (writes the same content again).
tee "%%1" > /dev/null << 'EOF'
%%2
EOF

# Appending a line instead of overwriting (GNU sed); the file to edit is %%1:
#sed -i '$a %%2' %%1

10.讀取檔案屬性
#!/bin/bash
# Report what kind of file %%1 is, whether the caller owns it and which of
# the read/write/execute permissions the caller has on it.
# Exits with status 1 when the path does not exist.
# Every expansion of $file is quoted so names with blanks or glob
# characters are tested as one word, and the obsolescent "-a" operator of
# [ ] is replaced by two tests joined with &&.
file="%%1"
file=${file:?'必須給出引數'}
if [ ! -e "$file" ]; then
    echo "$file 不存在"
    exit 1
fi
if [ -d "$file" ]; then
    echo "$file 是一個目錄"
    # For a directory, -x means it may be searched (entered).
    if [ -x "$file" ]; then
        echo "可以"
    else
        echo "不可以"
    fi
    echo "對此進行搜尋"
elif [ -f "$file" ]; then
    echo "$file 是一個正規檔案"
else
    echo "$file不是一個正規檔案"
fi
# -O: the file is owned by the effective user id.
if [ -O "$file" ]; then
    echo "你是$file的擁有者"
else
    echo "你不是$file的擁有者"
fi
if [ -r "$file" ]; then
    echo "你對$file擁有"
else
    echo "你並不對$file擁有"
fi
echo "可讀許可權"
if [ -w "$file" ]; then
    echo "你對$file擁有"
else
    echo "你並不對$file擁有"
fi
echo "可寫許可權"
# Execute permission is only reported for non-directories.
if [ -x "$file" ] && [ ! -d "$file" ]; then
    echo "你擁有對$file"
else
    echo "你並不擁有對$file"
fi
echo "可執行的許可權"

11.寫入檔案屬性
#!/bin/bash
#修改存放在ext2、ext3、ext4、xfs、ubifs、reiserfs、jfs等檔案系統上的檔案或目錄屬性,使用許可權超級使用者。
#一些功能是由Linux核心版本來支援的,如果Linux核心版本低於2.2,那麼許多功能不能實現。同樣-D檢查壓縮檔案中的錯誤的功能,需要2.5.19以上核心才能支援。另外,通過chattr命令修改屬性能夠提高系統的安全性,但是它並不適合所有的目錄。chattr命令不能保護/、/dev、/tmp、/var目錄。
chattr [-RV] [-+=AacDdijsSu] [-v version] 檔案或目錄
  -R:遞迴處理所有的檔案及子目錄。
  -V:詳細顯示修改內容,並列印輸出。
  -:失效屬性。
  +:啟用屬性。
  = :指定屬性。
  A:Atime,告訴系統不要修改對這個檔案的最後訪問時間。
  S:Sync,一旦應用程式對這個檔案執行了寫操作,使系統立刻把修改的結果寫到磁碟。
  a:Append Only,系統只允許在這個檔案之後追加資料,不允許任何程序覆蓋或截斷這個檔案。如果目錄具有這個屬性,系統將只允許在這個目錄下建立和修改檔案,而不允許刪除任何檔案。
  i:Immutable,系統不允許對這個檔案進行任何的修改。如果目錄具有這個屬性,那麼任何的程序只能修改目錄之下的檔案,不允許建立和刪除檔案。
  D:檢查壓縮檔案中的錯誤。
  d:No dump,在進行檔案系統備份時,dump程式將忽略這個檔案。
  c:Compress,系統以透明的方式壓縮這個檔案。從這個檔案讀取時,返回的是解壓之後的資料;而向這個檔案中寫入資料時,資料首先被壓縮之後才寫入磁碟。
  s:Secure Delete,讓系統在刪除這個檔案時,使用0填充檔案所在的區域。
  u:Undelete,當一個應用程式請求刪除這個檔案,系統會保留其資料塊以便以後能夠恢復刪除這個檔案。

12.列舉一個目錄中的所有資料夾
#!/bin/bash
# Enumerate a directory and every directory below it.
# The original loop body contained only a comment, which is a syntax error
# in the shell, and it split find's output on ":" so any path containing a
# colon was torn apart.  Paths are now passed NUL-delimited.

#######################################
# Print every directory at or below a starting directory, one per line.
# Arguments: $1 - starting directory
# Outputs:   directory paths on stdout
#######################################
list_dirs() {
  local path
  while IFS= read -r -d '' path; do
    # Replace this printf with the action to perform on each directory.
    printf '%s\n' "$path"
  done < <(find "$1" -type d -print0)
}

list_dirs "%%1"

13.複製資料夾
#!/bin/sh
# Copy %%1 to %%2: -r copies directories recursively, -f forces
# replacement of destination files that cannot be opened for writing.
cp -rf "%%1" "%%2"

14.複製一個目錄下所有的資料夾到另一個目錄下
#!/bin/bash
# Copy every sub-directory found directly inside one directory into another
# directory.  Regular files in the source directory are not copied.

#######################################
# Copy all immediate sub-directories of SRC into DEST.
# Arguments: $1 - source directory
#            $2 - destination directory
# Returns:   status of the last cp, 0 when nothing had to be copied
#######################################
copy_subdirs() {
  local src=$1 dest=$2
  local entry
  for entry in "$src"/*; do
    if [ -d "$entry" ]; then
      # -r is required: plain cp refuses to copy a directory, so the
      # original command failed for every entry it selected.
      cp -r -- "$entry" "$dest"
    fi
  done
}

copy_subdirs "%%1" "%%2" #$(pwd)

15.移動資料夾
#!/bin/sh
# Move (rename) the directory %%1 to %%2.
# mv has no -r option (it always moves whole directory trees), so the
# original "-rf" made mv stop with an "invalid option" error; only -f
# (never prompt before overwriting) is kept.
mv -f -- "%%1" "%%2"

16.移動一個目錄下所有的資料夾到另一個目錄下
#!/bin/bash
# Move every sub-directory found directly inside one directory into another
# directory.  Regular files in the source directory stay where they are.

#######################################
# Move all immediate sub-directories of SRC into DEST.
# Arguments: $1 - source directory
#            $2 - destination directory
# Returns:   status of the last mv, 0 when nothing had to be moved
#######################################
move_subdirs() {
  local src=$1 dest=$2
  local entry
  # Quoted expansions keep names with blanks or glob characters intact.
  for entry in "$src"/*; do
    if [ -d "$entry" ]; then
      mv -- "$entry" "$dest"
    fi
  done
}

move_subdirs "%%1" "%%2" #$(pwd)

17.以一個資料夾的框架在另一個目錄下建立資料夾和空檔案
#!/bin/bash
# Rebuild the skeleton of one directory tree inside another directory:
# every directory is recreated and every regular file is recreated as an
# empty file of the same name.
# The original only created the directories, although the snippet title
# promises empty files as well, and it split find's output on ":" with
# unquoted expansions.

#######################################
# Recreate the directory/file skeleton of SRC below DEST.
# Arguments: $1 - source directory
#            $2 - destination directory (created when missing)
#######################################
mirror_tree() {
  local src=${1%/} dest=$2
  local path rel
  while IFS= read -r -d '' path; do
    # Path relative to SRC: empty for SRC itself, "/sub/..." otherwise.
    rel=${path#"$src"}
    if [ -d "$path" ]; then
      mkdir -p -- "$dest$rel"
    else
      # touch creates an empty file and never truncates an existing one.
      touch -- "$dest$rel"
    fi
  done < <(find "$src" \( -type d -o -type f \) -print0)
}

mirror_tree "%%1" "%%2" #$(pwd)
#cp -a "%%1" "%%2"

表示式 含義
${#string}
{#string}
1,取得字串長度
string=abc12342341          //等號二邊不要有空格
echo ${#string}             //結果11
expr length $string         //結果11
expr "$string" : ".*"       //結果11 冒號二邊要有空格,這裡的:跟match的用法差不多
2,字串所在位置
expr index $string '123'    //結果4 expr index 回傳的位置是從1開始計算的(0表示找不到),而且找的是'123'中任一個字元最先出現的位置;這個方法讓我想起來了js的indexOf,各種語言對字串的操作方法大方向都差不多,如果有語言基礎的話,學習shell會很快的。
3,從字串開頭到子串的最大長度
expr match $string 'abc.*3' //結果9個人覺得這個函式的用處不大,為什麼要從開頭開始呢。
4,字串擷取
echo ${string:4}      //2342341  從第4位開始擷取後面所有字串
echo ${string:3:3}    //123      從第3位開始擷取後面3位
echo ${string:3:6}    //123423   從第3位開始擷取後面6位
echo ${string: -4}    //2341  :右邊有空格   擷取後4位
echo ${string:(-4)}   //2341  同上
expr substr $string 3 3   //c12  expr substr 的位置從1開始計算,所以是從第3個字元開始擷取3位(和上面從0開始的${string:3:3}不同);上面的方法讓我想起了,php的substr函式,後面擷取的規則是一樣的。
5,匹配顯示內容
//例3中也有match和這裡的match不同,上面顯示的是匹配字元的長度,而下面的是匹配的內容
expr match $string '\([a-c]*[0-9]*\)'  //abc12342341
expr $string : '\([a-c]*[0-9]\)'       //abc1
expr $string : '.*\([0-9][0-9][0-9]\)' //341 顯示括號中匹配的內容這裡括號的用法,是不是根其他的括號用法有相似之處呢,
6,擷取不匹配的內容
echo ${string#a*3}     //42341  從$string左邊開始,去掉最短匹配子串
echo ${string#c*3}     //abc12342341  這樣什麼也沒有匹配到
echo ${string#*c1*3}   //42341  從$string左邊開始,去掉最短匹配子串
echo ${string##a*3}    //41     從$string左邊開始,去掉最長匹配子串
echo ${string%3*1}     //abc12342  從$string右邊開始,去掉最短匹配子串
echo ${string%%3*1}    //abc12     從$string右邊開始,去掉最長匹配子串這裡要注意,必須從字串的第一個字元開始,或者從最後一個開始,
7,匹配並且替換
echo ${string/23/bb}   //abc1bb42341  替換一次
echo ${string//23/bb}  //abc1bb4bb41  雙斜槓替換所有匹配
echo ${string/#abc/bb} //bb12342341   #以什麼開頭來匹配,根php中的^有點像
echo ${string/%41/bb}  //abc123423bb  %以什麼結尾來匹配,根php中的$有點像

#!/bin/bash
# Launch every runnable file at or below the current directory in its own
# xterm, choosing the interpreter from the file extension.
#
# Fixes over the original:
#  - "$(direc)" was a command substitution (it ran a command named direc)
#    and the glob was quoted, so the first loop never saw a real file;
#  - the second loop parsed ls output and split paths on ":";
#  - top-level files were handled by both loops and would start twice;
#  - java was handed a file path where it expects a class name.

#######################################
# Start one file in an xterm according to its extension.
# Arguments: $1 - path of the file
# Returns:   exit status of xterm, 0 for unknown extensions
#######################################
launch_file() {
  local file=$1
  local dir name
  case "${file##*.}" in
    sh)
      xterm -e bash "$file"
      ;;
    bin | run | bundle)
      xterm -e "$file"
      ;;
    pl)
      xterm -e perl "$file"
      ;;
    class)
      # java needs the class name plus a class path, not a file path.
      dir=${file%/*}
      name=${file##*/}
      xterm -e java -cp "$dir" "${name%.class}"
      ;;
    rpm)
      xterm -e rpm -ivh "$file"
      ;;
    rb)
      xterm -e ruby "$file"
      ;;
    py)
      xterm -e python "$file"
      ;;
    jar)
      xterm -e java -jar "$file"
      ;;
  esac
}

direc=$(pwd)
# The file list arrives on descriptor 3 so the launched programs cannot
# consume it through their standard input.
while IFS= read -r -d '' -u 3 file; do
  launch_file "$file"
done 3< <(find "$direc" -type f -print0)

18.複製檔案
#!/bin/sh
# Copy the file %%1 to %%2.
# Both operands are quoted so paths containing blanks or glob characters
# stay single arguments; "--" protects names that start with "-".
cp -- "%%1" "%%2"

19.複製一個目錄下所有的檔案到另一個目錄
#!/bin/bash
# Copy every regular file found directly inside one directory into another
# directory.
#
# Fixes over the original:
#  - 'direc="%%1" $(pwd)' lacked the "#" and therefore tried to run the
#    output of pwd as a command;
#  - the glob was inside the quotes, so it was never expanded;
#  - the files were copied to %%1 (the source) instead of %%2.

#######################################
# Copy all regular files that are direct children of SRC into DEST.
# Arguments: $1 - source directory
#            $2 - destination directory
# Returns:   status of the last cp, 0 when nothing had to be copied
#######################################
copy_files() {
  local src=$1 dest=$2
  local file
  for file in "$src"/*; do
    if [ -f "$file" ]; then
      cp -- "$file" "$dest"
    fi
  done
}

copy_files "%%1" "%%2" #$(pwd)

20.提取副檔名
#!/bin/sh
# Store the extension of the path held in variable %%1 in variable %%2.
# "##*." removes the longest prefix that ends in a dot, leaving the text
# after the last dot.  The original "##." only removed one leading dot,
# so it returned the whole name.  A name without any dot is returned
# unchanged.
%%2=${%%1##*.}

21.提取檔名
#!/bin/sh
# Store the last component (file name) of the path %%1 in variable %%2.
# The path is quoted so blanks in it do not split it into several
# arguments; "--" protects paths that start with "-".
%%2="$(basename -- "%%1")"

22.提取檔案路徑
#!/bin/sh
# Store the directory part of the path %%1 in variable %%2.
# The path is quoted so blanks in it do not split it into several
# arguments; "--" protects paths that start with "-".
%%2="$(dirname -- "%%1")"

23.替換副檔名
#!/bin/sh
# Store in variable %%3 the file name of path %%1 with its extension
# replaced by the suffix held in variable %%2.
# The original appended the new suffix without removing the old extension
# ("a.txt" + ".md" gave "a.txt.md").  "%.*" now strips the shortest
# trailing ".something" first; a name without a dot is kept whole.
# NOTE(review): assumes the value of %%2 already contains its leading dot,
# as the original concatenation did — confirm.
base="$(basename -- "%%1")"
%%3="${base%.*}$%%2"

24.追加路徑
#!/bin/sh
# Store in variable %%3 the directory of path %%1 joined with the value of
# variable %%2.
# The path is quoted so blanks in it do not split it into several
# arguments; "--" protects paths that start with "-".
%%3="$(dirname -- "%%1")/$%%2"

25.移動檔案
#!/bin/sh
# Move (rename) the file %%1 to %%2.
mv "%%1" "%%2"

26.移動一個目錄下所有檔案到另一個目錄
#!/bin/bash
# Move every regular file found directly inside one directory into another
# directory.
#
# Fixes over the original:
#  - "$(direc)" was a command substitution (it ran a command named direc)
#    instead of expanding the variable;
#  - the glob was inside the quotes, so it was never expanded;
#  - the files were moved to %%1 (the source) instead of %%2;
#  - the IFS juggling is unnecessary once expansions are quoted.

#######################################
# Move all regular files that are direct children of SRC into DEST.
# Arguments: $1 - source directory
#            $2 - destination directory
# Returns:   status of the last mv, 0 when nothing had to be moved
#######################################
move_files() {
  local src=$1 dest=$2
  local file
  for file in "$src"/*; do
    if [ -f "$file" ]; then
      mv -- "$file" "$dest"
    fi
  done
}

move_files "%%1" "%%2" #$(pwd)

27.指定目錄下搜尋檔案
#!/bin/sh
# Search the current directory tree for entries whose name matches %%1.
# The starting directory "." is now explicit: only GNU find supplies it
# when it is left out, other implementations reject the command.
find . -name "%%1"

28.開啟檔案對話方塊
#!/bin/sh
# Show Xdialog's file selector starting in the home directory and store
# the chosen path in variable %%1 (Xdialog reports the selection on
# stderr, hence 2>&1).
# The original passed '~/' in single quotes; a quoted tilde is never
# expanded, so the dialog was given the literal text "~/".
%%1="$(Xdialog --fselect "$HOME/" 0 0 2>&1)"

29.檔案分割
#!/bin/sh
# Split %%1 into pieces of 2k bytes each (-b sets the piece size).
split -b 2k "%%1"

# Split whitespace-separated input from stdin by column: the first field of
# every line is appended to file f1, the second to f2 and the remainder of
# the line to f3.
# -r keeps backslashes literal; quoted printf writes each field verbatim
# (unquoted echo would glob-expand it and mangle values such as "-n").
while read -r f1 f2 f3; do
  printf '%s\n' "$f1" >> f1
  printf '%s\n' "$f2" >> f2
  printf '%s\n' "$f3" >> f3
done


#!/bin/bash
# Split a text file into numbered pieces file_1.log, file_2.log, ... of a
# fixed number of lines each (written to the current directory).

#######################################
# Split FILE into pieces of LINES lines.
# Arguments: $1 - file to split
#            $2 - lines per piece (default 1000)
# Returns:   0 on success, 1 when the file cannot be read
#######################################
split_by_lines() {
  local src=$1
  local chunk=${2:-1000}
  local total first=1 last piece=1

  if [ ! -r "$src" ]; then
    printf '%s: cannot read file\n' "$src" >&2
    return 1
  fi

  # awk's NR also counts a final line that lacks a trailing newline.
  total=$(awk 'END { print NR }' "$src") || return

  # "-le", not "-lt": with "-lt" the last line was lost whenever it was the
  # first line of a new piece (e.g. line 1001 of a 1001-line file).
  while [ "$first" -le "$total" ]; do
    last=$((first + chunk - 1))
    sed -n "${first},${last}p" "$src" > "file_${piece}.log"
    first=$((last + 1))
    piece=$((piece + 1))
  done
}

split_by_lines httperr8007.log 1000




其中httperr8007.log為你想分割的大檔案,file_$file.log  為分割後的檔案,最後為file_1.log,file_2.log,file_3.log……,分割完後的每個檔案只有1000行(引數可以自己設定)

split 引數:
-b  :後面可接欲分割成的檔案大小,可加單位,例如 b, k, m 等;
-l  :以行數來進行分割;



#按每個檔案1000行來分割

split -l 1000 httperr8007.log httperr

httperraa,httperrab,httperrac ........

#按照每個檔案100K來分割

split -b 100k httperr8007.log http

httpaa,httpab,httpac ........

#!/bin/bash
# Split a file into fixed-size pieces FILE.0, FILE.1, ... and generate a
# script named "merge" (in the current directory) that reassembles them
# into FILE.merged.
# Usage: split file size(in bytes)
#
# Fixes over the original:
#  - a stray "'" after "chmod u+x merge" made the whole script a syntax
#    error;
#  - "$i" inside the echo lines was expanded while generating merge, so the
#    generated loop compared two constants and never ran;
#  - the file size was parsed out of "ls -l"; all expansions were unquoted;
#  - the size argument was never validated (see the old TODO).

usage() {
  echo 'Usage: split file size(in bytes)' >&2
}

#######################################
# Write the "merge" script for a finished split.
# Arguments: $1 - original file name, $2 - piece size, $3 - piece count
#######################################
write_merge_script() {
  {
    printf '#!/bin/bash\n'
    # %q shell-quotes the values so unusual file names survive.
    printf 'file=%q\nsize=%q\npieces=%q\n' "$1" "$2" "$3"
    # Quoted delimiter: the loop below is copied literally, so its
    # variables are evaluated when merge runs, not now.
    cat <<'MERGE_BODY'
i=0
while [ "$i" -lt "$pieces" ]; do
  echo "merge: $file.$i"
  if [ ! -f "$file.$i" ]; then
    echo "merge: $file.$i missed"
    rm -f -- "$file.merged"
    exit 1
  fi
  dd if="$file.$i" of="$file.merged" bs="$size" count=1 seek="$i"
  i=$((i + 1))
done
MERGE_BODY
  } > merge
  chmod u+x merge
}

#######################################
# Split FILE into pieces of SIZE bytes and write the merge script.
# Arguments: $1 - file to split, $2 - piece size in bytes (positive integer)
# Returns:   0 on success, 1 on a bad argument or dd failure
#######################################
split_file() {
  local file=$1 size=$2
  local filesize pieces i

  if [ ! -f "$file" ]; then
    echo "$file doesn't exist" >&2
    return 1
  fi
  case $size in
    '' | *[!0-9]* | 0*)
      echo "$size is not a positive integer" >&2
      return 1
      ;;
  esac

  filesize=$(wc -c < "$file") || return
  filesize=$((filesize)) # drops the padding some wc versions print
  echo "filesize: $filesize"

  # Round up so a final partial piece is counted.
  pieces=$(((filesize + size - 1) / size))
  echo "pieces: $pieces"

  i=0
  while [ "$i" -lt "$pieces" ]; do
    echo "split: $file.$i:"
    dd if="$file" of="$file.$i" bs="$size" count=1 skip="$i" || return
    i=$((i + 1))
  done

  write_merge_script "$file" "$size" "$pieces"
}

main() {
  if [ "$#" -ne 2 ]; then
    usage
    return 2
  fi
  split_file "$1" "$2"
}

main "$@"

30.檔案合併
#!/bin/sh
# Merge two files: write the content of %%1 followed by the content of %%2
# into %%3.
# The original 'cp "%%1"+"%%2" "%%3"' is DOS "copy a+b c" syntax; on Unix
# cp looks for a single file literally named "%%1+%%2".
cat -- "%%1" "%%2" > "%%3"

# Join the files f1 and f2 line by line: line N of f1 and line N of f2 are
# appended to join.txt separated by one blank.  The loop stops as soon as
# either file is exhausted.
# The descriptors are attached to the loop itself, so they are closed again
# when it ends instead of staying open in the shell; "IFS= read -r" and
# printf keep each line's content verbatim.
while IFS= read -r left <&3 && IFS= read -r right <&4; do
  printf '%s %s\n' "$left" "$right"
done 3< f1 4< f2 >> join.txt

#!/bin/bash
# Split a file into fixed-size pieces FILE.0, FILE.1, ... and generate a
# script named "merge" (in the current directory) that reassembles them
# into FILE.merged.
# Usage: split file size(in bytes)
#
# Fixes over the original:
#  - a stray "'" after "chmod u+x merge" made the whole script a syntax
#    error;
#  - "$i" inside the echo lines was expanded while generating merge, so the
#    generated loop compared two constants and never ran;
#  - the file size was parsed out of "ls -l"; all expansions were unquoted;
#  - the size argument was never validated (see the old TODO).

usage() {
  echo 'Usage: split file size(in bytes)' >&2
}

#######################################
# Write the "merge" script for a finished split.
# Arguments: $1 - original file name, $2 - piece size, $3 - piece count
#######################################
write_merge_script() {
  {
    printf '#!/bin/bash\n'
    # %q shell-quotes the values so unusual file names survive.
    printf 'file=%q\nsize=%q\npieces=%q\n' "$1" "$2" "$3"
    # Quoted delimiter: the loop below is copied literally, so its
    # variables are evaluated when merge runs, not now.
    cat <<'MERGE_BODY'
i=0
while [ "$i" -lt "$pieces" ]; do
  echo "merge: $file.$i"
  if [ ! -f "$file.$i" ]; then
    echo "merge: $file.$i missed"
    rm -f -- "$file.merged"
    exit 1
  fi
  dd if="$file.$i" of="$file.merged" bs="$size" count=1 seek="$i"
  i=$((i + 1))
done
MERGE_BODY
  } > merge
  chmod u+x merge
}

#######################################
# Split FILE into pieces of SIZE bytes and write the merge script.
# Arguments: $1 - file to split, $2 - piece size in bytes (positive integer)
# Returns:   0 on success, 1 on a bad argument or dd failure
#######################################
split_file() {
  local file=$1 size=$2
  local filesize pieces i

  if [ ! -f "$file" ]; then
    echo "$file doesn't exist" >&2
    return 1
  fi
  case $size in
    '' | *[!0-9]* | 0*)
      echo "$size is not a positive integer" >&2
      return 1
      ;;
  esac

  filesize=$(wc -c < "$file") || return
  filesize=$((filesize)) # drops the padding some wc versions print
  echo "filesize: $filesize"

  # Round up so a final partial piece is counted.
  pieces=$(((filesize + size - 1) / size))
  echo "pieces: $pieces"

  i=0
  while [ "$i" -lt "$pieces" ]; do
    echo "split: $file.$i:"
    dd if="$file" of="$file.$i" bs="$size" count=1 skip="$i" || return
    i=$((i + 1))
  done

  write_merge_script "$file" "$size" "$pieces"
}

main() {
  if [ "$#" -ne 2 ]; then
    usage
    return 2
  fi
  split_file "$1" "$2"
}

main "$@"

31.檔案簡單加密
#!/bin/bash
# "Encrypt" the script %%1.sh by compiling it with shc; -f names the input
# script.
# Build/installation steps for shc itself:
#make test && make strings && sudo make install
shc -r -f %%1.sh
# NOTE(review): the two names below look like the files shc generates
# (binary and C source) — confirm the exact names.
#%%1.x
#%%1.x.c

32.檔案簡單解密
#!/bin/bash
# NOTE(review): although this snippet is titled "decrypt", its command is
# the same shc invocation as the "encrypt" snippet (-f names the input
# script); nothing here reverses the compilation — confirm what was meant.
# Build/installation steps for shc itself:
#make test && make strings && sudo make install
shc -r -f %%1.sh
#%%1.x
#%%1.x.c

33.讀取ini檔案屬性
#!/bin/bash
# Read or update a key in an INI file.
#   variable %%1 - INI file        variable %%2 - section name
#   variable %%3 - key (optional)  variable %%4 - value (optional)
#
# Fixes over the original:
#  - the two writing branches used "sed ... p" without -n, which printed
#    every line twice and doubled the file on each update;
#  - the file was addressed as $1 in some places and $%%1 in others, and
#    the section as $2 in one branch;
#  - the predictable /tmp/sed$$ is replaced by mktemp;
#  - all expansions are quoted.

#######################################
# Query or modify FILE.
#   key empty          -> print all entries of SECTION
#   value empty        -> print the value of KEY in SECTION
#   value is "#"       -> blank out the KEY line in SECTION
#   otherwise          -> set KEY=VALUE in SECTION (the key must exist)
# Arguments: $1 - file, $2 - section, $3 - key, $4 - value
# Returns:   0 on success, non-zero when the file is missing or sed fails
# Note: section, key and value are inserted into sed expressions, so they
#       must not contain "/" or regular-expression metacharacters.
#######################################
ini_access() {
  local file=$1 section=$2 key=$3 value=$4
  local tmp status=0

  if [ ! -f "$file" ]; then
    printf '%s: no such file\n' "$file" >&2
    return 1
  fi

  if [ -z "$key" ]; then
    # Section listing: drop headers, blank lines and ";" comments.
    sed -n "/\[$section\]/,/\[.*\]/{
      /^\[.*\]/d
      /^[[:space:]]*$/d
      s/;.*$//
      p
    }" "$file"
    return
  fi

  if [ -z "$value" ]; then
    # Print only the text after "key =" for the requested key.
    sed -n "/\[$section\]/,/\[.*\]/{
      /^\[.*\]/d
      /^[[:space:]]*$/d
      s/;.*$//
      s/^[[:space:]]*$key[[:space:]]*=[[:space:]]*\(.*\)/\1/p
    }" "$file"
    return
  fi

  tmp=$(mktemp) || return
  if [ "$value" = "#" ]; then
    sed "/\[$section\]/,/\[.*\]/{
      s/^[[:space:]]*$key[[:space:]]*=.*/ /
    }" "$file" > "$tmp" || status=$?
  else
    sed "/\[$section\]/,/\[.*\]/{
      s/^[[:space:]]*$key[[:space:]]*=.*/$key=$value/
    }" "$file" > "$tmp" || status=$?
  fi
  if [ "$status" -eq 0 ]; then
    # Copying the content back keeps the file's own permissions.
    cat "$tmp" > "$file" || status=$?
  fi
  rm -f -- "$tmp"
  return "$status"
}

ini_access "$%%1" "$%%2" "$%%3" "$%%4"

34.合併一個檔案下所有的檔案
#!/bin/sh
# Concatenate all files named "%%1.<something>" from the current directory,
# in sorted name order, into the file %%1.
# The shell glob replaces "ls | grep": ls output breaks on names with
# blanks, and when nothing matched the original ran cat without arguments
# and waited on standard input.
cat -- "%%1".* > "%%1"

#!/bin/bash
# Visit every *.c and *.cpp file below a directory.
# The original "if" body contained only a comment, which is a syntax error,
# and it split find's output on ":"; the regex that detected unmatched
# globs is no longer needed because find only reports existing files.

#######################################
# Print every *.c / *.cpp regular file at or below a directory.
# Arguments: $1 - starting directory
# Outputs:   file paths on stdout, one per line
#######################################
list_sources() {
  local file
  while IFS= read -r -d '' file; do
    # Replace this printf with the action to perform on each file.
    printf '%s\n' "$file"
  done < <(find "$1" -type f \( -name '*.c' -o -name '*.cpp' \) -print0)
}

list_sources "%%1"

#!/bin/bash
# Writes a small C program to combine.c (the here-doc delimiter is quoted,
# so the text is emitted verbatim), compiles it with gcc and runs the
# result when compilation succeeded.
# The C program opens a1.txt and a2.txt for reading and a3.txt for writing,
# reads int-sized words with getw(), and on each step writes the smaller of
# the two current values with putw(); once one input reaches end-of-file
# the remaining values of the other input are copied.
# NOTE(review): presumably both inputs are expected to be sorted — confirm.
# NOTE(review): the fopen() results are not checked for NULL.
cat <<'EOF'> combine.c
#include<stdio.h>
int main()
{
FILE *f1,*f2,*f3;
f1=fopen("a1.txt","r");
f2=fopen("a2.txt","r");
f3=fopen("a3.txt","w");
int a,b;
a=getw(f1);   /*從a1.txt和a2.txt中分別取最小的數a和b*/
b=getw(f2);
while(!feof(f1)&&!feof(f2))  /*兩個檔案都沒結束時,執行迴圈、比較*/
{
if(a<=b)
{
putw(a,f3);
a=getw(f1);
}
else
{putw(b,f3);
b=getw(f2);
}
   }
if(feof(f1))  /*檔案a1.txt結束時,把a2.txt中的數全部輸入a3.txt*/
{putw(b,f3);
while((b=getw(f2))!=EOF)
putw(b,f3);
}
if(feof(f2))   /*同上*/
{
putw(a,f3);
while((a=getw(f1))!=EOF)
putw(a,f3);
}
fclose(f1);
fclose(f2);
fclose(f3);
printf("已完成!");
return 0;
}
EOF
# Build the program; $? below is gcc's exit status.
gcc -o combine combine.c
if [ $? -eq 0 ]; then
./combine
else
echo 'Compile ERROR'
fi

35.寫入ini檔案屬性
#!/bin/bash
# Read or update a key in an INI file.
#   variable %%1 - INI file        variable %%2 - section name
#   variable %%3 - key (optional)  variable %%4 - value (optional)
#
# Fixes over the original:
#  - the two writing branches used "sed ... p" without -n, which printed
#    every line twice and doubled the file on each update;
#  - the file was addressed as $1 in some places and $%%1 in others;
#  - the predictable /tmp/sed$$ is replaced by mktemp;
#  - all expansions are quoted.

#######################################
# Query or modify FILE.
#   key empty          -> print all entries of SECTION
#   value empty        -> print the value of KEY in SECTION
#   value is "#"       -> blank out the KEY line in SECTION
#   otherwise          -> set KEY=VALUE in SECTION (the key must exist)
# Arguments: $1 - file, $2 - section, $3 - key, $4 - value
# Returns:   0 on success, non-zero when the file is missing or sed fails
# Note: section, key and value are inserted into sed expressions, so they
#       must not contain "/" or regular-expression metacharacters.
#######################################
ini_access() {
  local file=$1 section=$2 key=$3 value=$4
  local tmp status=0

  if [ ! -f "$file" ]; then
    printf '%s: no such file\n' "$file" >&2
    return 1
  fi

  if [ -z "$key" ]; then
    # Section listing: drop headers, blank lines and ";" comments.
    sed -n "/\[$section\]/,/\[.*\]/{
      /^\[.*\]/d
      /^[[:space:]]*$/d
      s/;.*$//
      p
    }" "$file"
    return
  fi

  if [ -z "$value" ]; then
    # Print only the text after "key =" for the requested key.
    sed -n "/\[$section\]/,/\[.*\]/{
      /^\[.*\]/d
      /^[[:space:]]*$/d
      s/;.*$//
      s/^[[:space:]]*$key[[:space:]]*=[[:space:]]*\(.*\)/\1/p
    }" "$file"
    return
  fi

  tmp=$(mktemp) || return
  if [ "$value" = "#" ]; then
    sed "/\[$section\]/,/\[.*\]/{
      s/^[[:space:]]*$key[[:space:]]*=.*/ /
    }" "$file" > "$tmp" || status=$?
  else
    sed "/\[$section\]/,/\[.*\]/{
      s/^[[:space:]]*$key[[:space:]]*=.*/$key=$value/
    }" "$file" > "$tmp" || status=$?
  fi
  if [ "$status" -eq 0 ]; then
    # Copying the content back keeps the file's own permissions.
    cat "$tmp" > "$file" || status=$?
  fi
  rm -f -- "$tmp"
  return "$status"
}

ini_access "$%%1" "$%%2" "$%%3" "$%%4"

36.獲得當前路徑
#!/bin/sh
# Store the current working directory, as printed by pwd, in variable %%1.
%%1=$(pwd)

37.讀取XML資料庫

如何通過shell命令列讀取xml檔案中某個屬性所對應的值?
例如:
<key>BuildVersion</key> <string>5</string>
我希望能夠通過Unix shell命令對屬性鍵的名稱BuildVersion進行查詢,返回的結果是5,如何實現呀?
#!/bin/bash
# Print the <string> value that belongs to a <key> in plist-style XML read
# from standard input.
# The original grep|sed pipeline only looked at the line containing the
# key, so it printed the key name itself whenever <string>...</string> sat
# on the following line.  The value is now taken from the first <string>
# element found after the key, on the same line or a later one.

#######################################
# Arguments: $1 - key name, e.g. BuildVersion
# Input:     XML text on stdin
# Outputs:   the value on stdout; nothing when the key is absent
#######################################
plist_value() {
  awk -v key="$1" '
    BEGIN { tag = "<key>" key "</key>" }
    !found {
      pos = index($0, tag)
      if (!pos) next
      found = 1
      # Ignore everything up to and including the key on this line.
      $0 = substr($0, pos + length(tag))
    }
    match($0, /<string>[^<]*<\/string>/) {
      # 8 = length of "<string>", 17 = 8 + length of "</string>".
      print substr($0, RSTART + 8, RLENGTH - 17)
      exit
    }'
}

plist_value BuildVersion

結果返回的是“BuildVersion”,而不是“5”,如果要查詢BuildVersion自動返回數值5應當如何寫?

應該沒錯的。試一下: echo "<key>BuildVersion</key> <string>5</string>"|grep BuildVersion|sed 's/.*<.*>\([^<].*\)<.*>.*/\1/'我在SL的終端裡試,返回值是5

目前需要從xml檔案提取資料,想做一個xmlparser.sh
xml 類似這樣
<result>
   <shareinfo hostip="192.168.0.1" sharename="abcd" password="abc123"></shareinfo>
</result>


希望輸入 xmlparser.sh a.xml hostip可以返回192.168.0.1


#!/bin/sh
# xmlparser.sh <xmlfile> <key>
# Print the value of the attribute <key> for every line of <xmlfile> that
# carries it, e.g. "xmlparser.sh a.xml hostip" -> 192.168.0.1.
#
# The original took the second blank-separated word of the matching line
# and kept only digits and dots, so it worked for hostip alone and returned
# nothing useful for attributes such as sharename.  The value is now taken
# from between the quotes that follow key=.  A usage error is reported on
# stderr with a non-zero status instead of "exit 0".

# xml_attr FILE KEY - print the quoted value of attribute KEY.
# When a line holds KEY more than once, the last occurrence is printed.
xml_attr() {
  sed -n 's/.*[[:space:]]'"$2"'="\([^"]*\)".*/\1/p' "$1"
}

main() {
  if [ "$#" -ne 2 ]; then
    echo "Usage: $0 <xmlfile> <key>" >&2
    return 2
  fi
  xml_attr "$1" "$2"
}

main "$@"



grep $2 $1|awk '{print $2}'|grep -o "[0-9.]*"
改成
grep $2 $1|awk '{print $2}'|grep -Eo "[0-9.]+"
樓上這個有問題,如果我要得到的是
<result>
   <shareinfo hostip="192.168.0.1" sharename="abcd" password="abc123"></shareinfo>
</result>
中的sharename,那麼,呵呵,就錯了

我覺得應該先定位到第二個引數“$2”的位置,然後再提取“=”後面的內容

這裡有個完整的實現:
Parse Simple XML Files using Bash – Extract Name Value Pairs and Attributes
http://www.humbug.in/2010/parse-simple-xml-files-using-bash-extract-name-value-pairs-and-attributes/


不過需要安裝xmllint.

設計到對多個xml檔案進行element的讀取和列表。有人做過麼?
舉個例子,
多個xml檔案裡面都有
<article>
        <title>xxx</titlel>
</article>

通過shell讀取,然後合併到一起,再生成一個新的xml,但是其他元素不變。
<article>
        <title>aaa</titlel>
</article>
<article>
        <title>bbb</titlel>
</article>

如果格式異常簡單,沒有特例,那麼可以用shell實現
如果有可能格式複雜,因為shell的命令所使用的正則表示式都不支援跨行匹配,所以用shell來解決這個問題就繞圈子了。
用perl來作這個工作最直接、簡單。perl的XML:DOM模組是專門處理XML檔案的。

偶倒是覺得,用PHP寫Scripts也很方便,功能強大,而且,跨平臺,

#!/bin/sh

# Filter XML on standard input with sed -n (nothing is printed unless a
# "p" command runs).
# For a line that contains <article>, N appends the next input line.  When
# that appended line starts with optional whitespace followed by <title>,
# another line is appended and the buffer is printed if it then contains
# <article> ... </article>.
# D then deletes the buffer up to its first newline and starts the next
# cycle.
# NOTE(review): the "n" after "D" appears to be unreachable, because D
# always ends the current cycle — confirm.


sed -n '/<article>/{

N;

/\n[[:space:]]*<title>/{

    N;

    /<article>.*<\/article>/p

    }

D;

n

}'


這小段程式碼能把一個xml檔案中,你要的東西拿出來.
你可以用for file in $*把這些資訊都>>tmpfile中.
然後用sed 在指定檔案的指定位置用r命令把tmpfile貼上進來~~~~

大思路如此^_^  我想有這個東西(只要能正確的跑出結果)後面就不難了吧...

Name
xmllint — command line XML tool

Synopsis
xmllint [[--version] | [--debug] | [--shell] | [--debugent] | [--copy] | [--recover] | [--noent] | [--noout] | [--nonet] | [--htmlout] | [--nowrap] | [--valid] | [--postvalid] | [--dtdvalid URL] | [--dtdvalidfpi FPI] | [--timing] | [--output file] | [--repeat] | [--insert] | [--compress] | [--html] | [--xmlout] | [--push] | [--memory] | [--maxmem nbbytes] | [--nowarning] | [--noblanks] | [--nocdata] | [--format] | [--encode encoding] | [--dropdtd] | [--nsclean] | [--testIO] | [--catalogs] | [--nocatalogs] | [--auto] | [--xinclude] | [--noxincludenode] | [--loaddtd] | [--dtdattr] | [--stream] | [--walker] | [--pattern patternvalue] | [--chkregister] | [--relaxng] | [--schema] | [--c14n]] [xmlfile]

Introduction
The xmllint program parses one or more XML files, specified on the command line as xmlfile. It prints various types of output, depending upon the options selected. It is useful for detecting errors both in XML code and in the XML parser itself.

It is included in libxml2.

Options
--version
Display the version of libxml2 used.
--debug
Parse a file and output an annotated tree of the in-memory version of the document.
--shell
Run a navigating shell. Details on available commands in shell mode are below.
--debugent
Debug the entities defined in the document.
--copy
Test the internal copy implementation.
--recover
Output any parsable portions of an invalid document.
--noent
Substitute entity values for entity references. By default, xmllint leaves entity references in place.
--nocdata
Substitute CDATA section by equivalent text nodes.
--nsclean
Remove redundant namespace declarations.
--noout
Suppress output. By default, xmllint outputs the result tree.
--htmlout
Output results as an HTML file. This causes xmllint to output the necessary HTML tags surrounding the result tree output so the results can be displayed in a browser.
--nowrap
Do not output HTML doc wrapper.
--valid
Determine if the document is a valid instance of the included Document Type Definition (DTD). A DTD to be validated against also can be specified at the command line using the --dtdvalid option. By default, xmllint also checks to determine if the document is well-formed.
--postvalid
Validate after parsing is completed.
--dtdvalid URL
Use the DTD specified by URL for validation.
--dtdvalidfpi FPI
Use the DTD specified by the Public Identifier FPI for validation, note that this will require a Catalog exporting that Public Identifier to work.
--timing
Output information about the time it takes xmllint to perform the various steps.
--output file
Define a file path where xmllint will save the result of parsing. Usually the programs build a tree and save it on stdout, with this option the result XML instance will be saved onto a file.
--repeat
Repeat 100 times, for timing or profiling.
--insert
Test for valid insertions.
--compress
Turn on gzip compression of output.
--html
Use the HTML parser.
--xmlout
Used in conjunction with --html. Usually when HTML is parsed the document is saved with the HTML serializer, but with this option the resulting document is saved with the XML serializer. This is primarily used to generate XHTML from HTML input.
--push
Use the push mode of the parser.
--memory
Parse from memory.
--maxmem nnbytes
Test the parser memory support. nnbytes is the maximum number of bytes the library is allowed to allocate. This can also be used to make sure batch processing of XML files will not exhaust the virtual memory of the server running them.
--nowarning
Do not emit warnings from the parser and/or validator.
--noblanks
Drop ignorable blank spaces.
--format
Reformat and reindent the output. The $XMLLINT_INDENT environment variable controls the indentation (default value is two spaces " ").
--testIO
Test user input/output support.
--encode encoding
Output in the given encoding.
--catalogs
Use the catalogs from $SGML_CATALOG_FILES. Otherwise /etc/xml/catalog is used by default.
--nocatalogs
Do not use any catalogs.
--auto
Generate a small document for testing purposes.
--xinclude
Do XInclude processing.
--noxincludenode
Do XInclude processing but do not generate XInclude start and end nodes.
--loaddtd
Fetch external DTD.
--dtdattr
Fetch external DTD and populate the tree with inherited attributes.
--dropdtd
Remove DTD from output.
--stream
Use streaming API - useful when used in combination with --relaxng or --valid options for validation of files that are too large to be held in memory.
--walker
Test the walker module, which is a reader interface but for a document tree, instead of using the reader API on an unparsed document it works on a existing in-memory tree. Used in debugging.
--chkregister
Turn on node registration. Useful for developers testing libxml2 node tracking code.
--pattern patternvalue
Used to exercise the pattern recognition engine, which can be used with the reader interface to the parser. It allows to select some nodes in the document based on an XPath (subset) expression. Used for debugging.
--relaxng schema
Use RelaxNG file named schema for validation.
--schema schema
Use a W3C XML Schema file named schema for validation.
--c14n
Use the W3C XML Canonicalisation (C14N) to serialize the result of parsing to stdout. It keeps comments in the result.
Shell
xmllint offers an interactive shell mode invoked with the --shell command. Available commands in shell mode include:

base
display XML base of the node
bye
leave shell
cat node
Display node if given or current node.
cd path
Change the current node to path (if given and unique) or root if no argument given.
dir path
Dumps information about the node (namespace, attributes, content).
du path
Show the structure of the subtree under path or the current node.
exit
Leave the shell.
help
Show this help.
free
Display memory usage.
load name
Load a new document with the given name.
ls path
List contents of path (if given) or the current directory.
pwd
Display the path to the current node.
quit
Leave the shell.
save name
Saves the current document to name if given or to the original name.
validate
Check the document for error.
write name
Write the current node to the given filename.
Catalogs
Catalog behavior can be changed by redirecting queries to the user's own set of catalogs. This can be done by setting the XML_CATALOG_FILES environment variable to a list of catalogs. An empty one should deactivate loading the default /etc/xml/catalog default catalog.

Debugging Catalogs
Setting the environment variable XML_DEBUG_CATALOG using the command "export XML_DEBUG_CATALOG=" outputs debugging information related to catalog operations.

Error Return Codes
On the completion of execution, Xmllint returns the following error codes:

0
No error
1
Unclassified
2
Error in DTD
3
Validation error
4
Validation error
5
Error in schema compilation
6
Error writing output
7
Error in pattern (generated when [--pattern] option is used)
8
Error in Reader registration (generated when [--chkregister] option is used)
9
Out of memory error

Parse Simple XML Files using Bash – Extract Name Value Pairs and Attributes


2 Comments
1
Tweet




Pratik Sinha | July 31, 2010


I have written up a simple routine parseXML to parse simple XML files to extract unique name values pairs and their attributes. The script extracts all xml tags of the format <abc arg1="hello">xyz</abc> and dynamically creates bash variables which hold values of the attributes as well as the elements. This is a good solution, if you don’t wish to use xpath for some simple xml files. However you will need xmllint installed on your system to use the script. Here’s a sample script which uses the parseXML function
#!/bin/bash
# Parse a simple XML file (path given as $1) and create one shell variable
# per element and per attribute, named <root>_<element> and
# <root>_<element>_<attribute>.  Requires xmllint.
xmlFile=$1

#######################################
# Create the variables described above from $xmlFile.
# The function name had been garbled to "par***ML" in this copy; it is
# restored to parseXML, and $xmlFile is quoted so an empty or blank-
# containing path no longer makes cat read standard input.
# Globals:   xmlFile (read); elemList, suffix and the generated variables
#            (written - they must stay global to be usable by the caller)
# Returns:   1 when $xmlFile cannot be read
# NOTE: element text and attribute values are passed through eval, so only
#       run this on XML files you trust.
#######################################
parseXML() {
  if [ ! -r "$xmlFile" ]; then
    printf 'Usage: %s <xmlfile>\n' "$0" >&2
    return 1
  fi

  elemList=( $(cat "$xmlFile" | tr '\n' ' ' | XMLLINT_INDENT="" xmllint --format - | /bin/grep -e "</.*>$" | while read line; do \
    echo $line | sed -e 's/^.*<\///' | cut -d '>' -f 1; \
  done) )

  # The last closing tag is the root element; it prefixes every variable.
  totalNoOfTags=${#elemList[@]}; ((totalNoOfTags--))
  suffix=$(echo ${elemList[$totalNoOfTags]} | tr -d '</>')
  suffix="${suffix}_"

  for (( i = 0 ; i < ${#elemList[@]} ; i++ )); do
    elem=${elemList[$i]}
    elemLine=$(cat "$xmlFile" | tr '\n' ' ' | XMLLINT_INDENT="" xmllint --format - | /bin/grep "</$elem>")
    # Skip lines that consist of a closing tag only (container elements).
    echo $elemLine | grep -e "^</[^ ]*>$" 1>/dev/null 2>&1
    if [ "0" = "$?" ]; then
      continue
    fi
    elemVal=$(echo $elemLine | tr '\011' '\040'| sed -e 's/^[ ]*//' -e 's/^<.*>\([^<].*\)<.*>$/\1/' | sed -e 's/^[ ]*//' | sed -e 's/[ ]*$//')
    xmlElem="${suffix}$(echo $elem | sed 's/-/_/g')"
    eval ${xmlElem}=`echo -ne \""${elemVal}"\"`
    # attrList alternates attribute names and values; blanks inside values
    # are temporarily stored as ">" so they survive word splitting.
    attrList=($(cat "$xmlFile" | tr '\n' ' ' | XMLLINT_INDENT="" xmllint --format - | /bin/grep "</$elem>" | tr '\011' '\040' | sed -e 's/^[ ]*//' | cut -d '>' -f 1  | sed -e 's/^<[^ ]*//' | tr "'" '"' | tr '"' '\n'  | tr '=' '\n' | sed -e 's/^[ ]*//' | sed '/^$/d' | tr '\011' '\040' | tr ' ' '>'))
    for (( j = 0 ; j < ${#attrList[@]} ; j++ )); do
      attr=${attrList[$j]}
      ((j++))
      attrVal=$(echo ${attrList[$j]} | tr '>' ' ')
      attrName=`echo -ne ${xmlElem}_${attr}`
      eval ${attrName}=`echo -ne \""${attrVal}"\"`
    done
  done
}

parseXML
echo "$status_xyz |  $status_abc |  $status_pqr" #Variables for each  XML ELement
echo "$status_xyz_arg1 |  $status_abc_arg2 |  $status_pqr_arg3 | $status_pqr_arg4" #Variables for each XML Attribute
echo ""

#All the variables that were produced by the parseXML function
set | /bin/grep -e "^$suffix"

The XML File used for the above script example is:
<?xml version="1.0"?>
<status>
  <xyz arg1="1"> a </xyz>
  <abc arg2="2"> p </abc>
  <pqr arg3="3" arg4="a phrase"> x </pqr>
</status>


The root tag, which in this case is “status”, is used as a suffix for all variables. Once the XML file is passed to the function, it dynamically creates the variables $status_xyz, $status_abc, $status_pqr, $status_xyz_arg1, $status_abc_arg2, $status_pqr_arg3 and $status_pqr_arg4.

The output when the script is ran with the xml file as an argument is
@$ bash  parseXML.sh test.xml
a |  p |  x
1 |  2 |  3 | a phrase

status_abc=p
status_abc_arg2=2
status_pqr=x
status_pqr_arg3=3
status_pqr_arg4='a phrase'
status_xyz=a
status_xyz_arg1=1

This script won’t work for XML files like the one below with duplicate element names.
<?xml version="1.0"?>
<status>
  <test arg1="1"> a </test>
  <test arg2="2"> p </test>
  <test arg3="3" arg4="a phrase"> x </test>
</status>


This script also won’t be able to extract attributes of elements without any CDATA. For eg, the script won’t be able to create variables corresponding to <test arg1="1">. It will only create the variables corresponding to <test1 arg2="2">abc</test1>.
<?xml version="1.0"?>
<status>
  <test arg1="1">
    <test1 arg2="2">abc</test1>
  </test>
</status>

38.寫入XML資料庫
#!/bin/bash

39.ZIP壓縮檔案
#!/bin/sh
# Add %%2 to the zip archive /%%1; -r descends into directories.
# NOTE(review): the leading "/" puts the archive under the filesystem root
# unless %%1 is meant to be the rest of an absolute path — confirm.
zip -r "/%%1" "%%2"

40.ZIP解壓縮
#!/bin/sh
# Extract the zip archive /%%1 into the directory %%2.
# In unzip, -x introduces a list of files to EXCLUDE, so the original
# "unzip -x archive dir" did not extract into a directory; -d names the
# extraction directory.
# NOTE(review): the leading "/" is kept from the original — confirm that
# %%1 is meant to be the rest of an absolute path.
unzip "/%%1" -d "%%2"

41.獲得應用程式完整路徑
#!/bin/bash

42.ZIP壓縮資料夾
#!/bin/bash

43.遞迴刪除目錄下的檔案
#!/bin/bash
# Recursively delete the regular files below a directory while keeping the
# directory structure itself.
#
# Fixes over the original:
#  - 'rm -if "%%1/*"' quoted the glob, so it addressed one file literally
#    named "*";
#  - the loop's "if" body contained only a comment (a syntax error) and
#    only looked at *.c / *.cpp files, which does not match the title.

#######################################
# Delete every regular file at or below a directory.
# Arguments: $1 - directory (must be a non-empty string)
# Returns:   exit status of find
#######################################
delete_files_recursive() {
  find "${1:?}" -type f -exec rm -f -- {} +
}

delete_files_recursive "%%1"

44.IDEA加密演算法
#!/bin/bash

45.RC6演算法
#!/bin/bash
# Writes an RC6 block-cipher implementation to rc6.c, compiles it with gcc
# and runs the result when compilation succeeded.
#
# Fixes over the original:
#  - the index in "l_key[i]" had been lost in four places (both round
#    macros and the key-schedule loop), leaving invalid expressions such
#    as "l_key = a";
#  - the program included "../std_defs.h", which is not part of this
#    snippet; the few definitions it needs (u4byte, rotl, rotr) are now
#    provided inline so the file compiles on its own;
#  - after a successful build the script ran ./combine (a leftover from
#    another snippet) instead of ./rc6.
cat <<'EOF'> rc6.c
#include <stdio.h>
#include <stdint.h>
/* Timing data for RC6 (rc6.c)

128 bit key:
Key Setup:    1632 cycles
Encrypt:       270 cycles =    94.8 mbits/sec
Decrypt:       226 cycles =   113.3 mbits/sec
Mean:          248 cycles =   103.2 mbits/sec

192 bit key:
Key Setup:    1885 cycles
Encrypt:       267 cycles =    95.9 mbits/sec
Decrypt:       235 cycles =   108.9 mbits/sec
Mean:          251 cycles =   102.0 mbits/sec

256 bit key:
Key Setup:    1877 cycles
Encrypt:       270 cycles =    94.8 mbits/sec
Decrypt:       227 cycles =   112.8 mbits/sec
Mean:          249 cycles =   103.0 mbits/sec

*/

/* 32-bit word type and rotations (the rotation count is taken modulo 32) */

typedef uint32_t u4byte;

#define rotl(x,n)   ((u4byte)(((x) << ((n) & 31)) | ((x) >> ((32 - ((n) & 31)) & 31))))
#define rotr(x,n)   ((u4byte)(((x) >> ((n) & 31)) | ((x) << ((32 - ((n) & 31)) & 31))))

static char *alg_name[] = { "rc6", "rc6.c", "rc6" };

char **cipher_name()
{
    return alg_name;
}

#define f_rnd(i,a,b,c,d)                    \
        u = rotl(d * (d + d + 1), 5);       \
        t = rotl(b * (b + b + 1), 5);       \
        a = rotl(a ^ t, u) + l_key[i];      \
        c = rotl(c ^ u, t) + l_key[i + 1]

#define i_rnd(i,a,b,c,d)                    \
        u = rotl(d * (d + d + 1), 5);       \
        t = rotl(b * (b + b + 1), 5);       \
        c = rotr(c - l_key[i + 1], t) ^ u;  \
        a = rotr(a - l_key[i], u) ^ t

u4byte  l_key[44];  /* storage for the key schedule         */

/* initialise the key schedule from the user supplied key   */
/* key_len is the key length in bits (128, 192 or 256)      */

u4byte *set_key(const u4byte in_key[], const u4byte key_len)
{   u4byte  i, j, k, a, b, l[8], t;

    l_key[0] = 0xb7e15163;

    for(k = 1; k < 44; ++k)

        l_key[k] = l_key[k - 1] + 0x9e3779b9;

    for(k = 0; k < key_len / 32; ++k)

        l[k] = in_key[k];

    t = (key_len / 32) - 1; // t = (key_len / 32);

    a = b = i = j = 0;

    for(k = 0; k < 132; ++k)
    {   a = rotl(l_key[i] + a + b, 3); b += a;
        b = rotl(l[j] + b, b);
        l_key[i] = a; l[j] = b;
        i = (i == 43 ? 0 : i + 1); // i = (i + 1) % 44;
        j = (j == t ? 0 : j + 1);  // j = (j + 1) % t;
    }

    return l_key;
}

/* encrypt a block of text  */

void encrypt(const u4byte in_blk[4], u4byte out_blk[4])
{   u4byte  a,b,c,d,t,u;

    a = in_blk[0]; b = in_blk[1] + l_key[0];
    c = in_blk[2]; d = in_blk[3] + l_key[1];

    f_rnd( 2,a,b,c,d); f_rnd( 4,b,c,d,a);
    f_rnd( 6,c,d,a,b); f_rnd( 8,d,a,b,c);
    f_rnd(10,a,b,c,d); f_rnd(12,b,c,d,a);
    f_rnd(14,c,d,a,b); f_rnd(16,d,a,b,c);
    f_rnd(18,a,b,c,d); f_rnd(20,b,c,d,a);
    f_rnd(22,c,d,a,b); f_rnd(24,d,a,b,c);
    f_rnd(26,a,b,c,d); f_rnd(28,b,c,d,a);
    f_rnd(30,c,d,a,b); f_rnd(32,d,a,b,c);
    f_rnd(34,a,b,c,d); f_rnd(36,b,c,d,a);
    f_rnd(38,c,d,a,b); f_rnd(40,d,a,b,c);

    out_blk[0] = a + l_key[42]; out_blk[1] = b;
    out_blk[2] = c + l_key[43]; out_blk[3] = d;
}

/* decrypt a block of text  */

void decrypt(const u4byte in_blk[4], u4byte out_blk[4])
{   u4byte  a,b,c,d,t,u;

    d = in_blk[3]; c = in_blk[2] - l_key[43];
    b = in_blk[1]; a = in_blk[0] - l_key[42];

    i_rnd(40,d,a,b,c); i_rnd(38,c,d,a,b);
    i_rnd(36,b,c,d,a); i_rnd(34,a,b,c,d);
    i_rnd(32,d,a,b,c); i_rnd(30,c,d,a,b);
    i_rnd(28,b,c,d,a); i_rnd(26,a,b,c,d);
    i_rnd(24,d,a,b,c); i_rnd(22,c,d,a,b);
    i_rnd(20,b,c,d,a); i_rnd(18,a,b,c,d);
    i_rnd(16,d,a,b,c); i_rnd(14,c,d,a,b);
    i_rnd(12,b,c,d,a); i_rnd(10,a,b,c,d);
    i_rnd( 8,d,a,b,c); i_rnd( 6,c,d,a,b);
    i_rnd( 4,b,c,d,a); i_rnd( 2,a,b,c,d);

    out_blk[3] = d - l_key[1]; out_blk[2] = c;
    out_blk[1] = b - l_key[0]; out_blk[0] = a;
}
int main()
{

return 0;
}
EOF
# Run the freshly built program only when gcc succeeded.
if gcc -o rc6 rc6.c; then
  ./rc6
else
  echo 'Compile ERROR'
fi

46.Grep
#!/bin/bash
# Test whether the file %%2 contains a match for the extended regular
# expression %%1; -q prints nothing, the result is the exit status.
# Pattern and file are quoted so blanks or glob characters in them are not
# split or expanded; "--" protects a pattern that starts with "-".
grep -qE -- "%%1" "%%2"

47.直接建立多級目錄
#!/bin/bash
# Create the directory %%1 together with any missing parent directories.
# The path is quoted so a name containing blanks is created as one
# directory instead of several.
mkdir -p -- "%%1"

48.批量重新命名
#!/bin/bash
# Batch renaming.
#
# Fixes over the original:
#  - the mv commands were assembled as text and piped into sh, so any path
#    with blanks or shell metacharacters was split or executed;
#  - sed removed EVERY ".cpp" in the path, including those in directory
#    names, producing wrong source paths;
#  - the second command parsed ls output.

#######################################
# Rename every *.cpp file at or below a directory to *.c.
# Arguments: $1 - starting directory (default: current directory)
#######################################
rename_cpp_to_c() {
  find "${1:-$PWD}" -type f -name '*.cpp' -exec sh -c '
    for src in "$@"; do
      mv -- "$src" "${src%.cpp}.c"
    done' sh {} +
}

rename_cpp_to_c "$PWD"

# Print (do not run) the mv commands that would drop the prefix up to the
# first "-" from each name in the current directory.
for name in *-*; do
  [ -e "$name" ] || continue
  printf 'mv -- %q %q\n' "$name" "${name#*-}"
done #去掉帶'-'的字首

49.文字查詢替換
#!/bin/bash
# Print the file %%1 with every match of %%2 replaced by %%3.  ":" is used
# as the delimiter so patterns containing "/" need no escaping.
# The file name is quoted so a path containing blanks stays one argument.
sed -e 's:%%2:%%3:g' "%%1"
# Same substitution with the conventional "/" delimiter:
#sed -e 's/%%2/%%3/g' "%%1"

50.檔案關聯
#!/bin/bash

51.批量轉換編碼從GB2312到Unicode
#!/bin/bash
# Convert every regular file below the current directory from one
# character encoding to another, in place, keeping mode and ownership.
#
# Fixes over the original:
#  - "for FILE in $(find ...)" split paths on blanks;
#  - the temp file replaced the original even when iconv had failed, which
#    destroyed the file; now a failed conversion leaves it untouched;
#  - a temp file was created (and leaked) for entries that were skipped;
#  - "chown user.group" used the deprecated dot separator.
scode="gbk"
dcode="ucs2"

#######################################
# Convert all regular files at or below ROOT from FROM to TO.
# Arguments: $1 - root directory, $2 - source encoding, $3 - target encoding
# Returns:   non-zero only when a temp file cannot be created
#######################################
convert_tree() {
  local root=$1 from=$2 to=$3
  local path tmp mode owner
  local -a files=()

  # Collect the list first so the temp files created below are never
  # picked up by the traversal.
  while IFS= read -r -d '' path; do
    files+=("$path")
  done < <(find "$root" -type f -print0)

  for path in "${files[@]}"; do
    tmp=$(mktemp -p "$root") || return
    if iconv -f "$from" -t "$to" "$path" > "$tmp"; then
      mode=$(stat -c %a "$path")
      owner=$(stat -c %U:%G "$path")
      mv -f -- "$tmp" "$path"
      chmod "$mode" "$path"
      chown "$owner" "$path"
    else
      rm -f -- "$tmp"
      printf 'skipped (conversion failed): %s\n' "$path" >&2
    fi
  done
}

convert_tree "$(pwd)" "$scode" "$dcode"

52.設定JDK環境變數
#!/bin/bash
# Install-and-configure helper for a JDK shipped as *.bin installers:
#  1. makes every *.bin file below the current directory executable,
#  2. runs each one in an xterm and deletes it when the run succeeded,
#  3. scans ~/.bashrc for existing JAVA_HOME / PATH / CLASSPATH exports,
#  4. appends the missing exports or rewrites the JAVA_HOME line.
# NOTE(review): the appended JAVA_HOME uses jdk1.6.0_25 while the
# replacement uses jdk1.6.0_32 — confirm which version is intended.
find "$PWD" -type f \( -iname '*.bin' \) -print0 | xargs -0 chmod +x
find -type f \( -iname '*.bin' \) -print |
while read filename
do
    case "$filename" in
    *.bin)
        # rm only runs when xterm (and so the installer) exited with 0.
        xterm -e "$filename" && rm -if "$filename"
        ;;
    esac
done
# Split the content of ~/.bashrc on newlines only, so each loop iteration
# sees one whole line.
OLDIFS=$IFS
IFS=$'\n'
for line in `cat ~/.bashrc`
do
# Remember an "export ... JAVA_HOME=/some/path" line.
if [[ "$line" =~ .*export.* ]]; then
    if [[ "$line" =~ .*JAVA_HOME=.* ]]; then
      if [[ "$line" =~ =(\/([0-9a-zA-Z._]+))+ ]]; then
       javahome=$line
      fi
    fi
fi
# Remember the PATH and CLASSPATH exports when they already exist.
if [[ "$line" =~ export\ PATH=\$PATH:\$JAVA_HOME/bin:\$JAVA_HOME/jre/bin$ ]];then
    javapath=$line
fi
if [[ "$line" =~ export\ CLASSPATH=.:\$JAVA_HOME/lib:\$JAVA_HOME/jre/lib$ ]];then
    classpath=$line
fi
done
# sed '$a text' appends text after the last line of the file.
if [ ! -n "$javahome" ]; then
sed -i '$a export JAVA_HOME='$(pwd)'/jdk1.6.0_25' ~/.bashrc
else
sed -i 's:'${javahome//\\/\\\\}':export JAVA_HOME='$(pwd)'/jdk1.6.0_32:g' ~/.bashrc
fi
if [ ! -n "$javapath" ]; then
sed -i '$a export PATH=$PATH:$JAVA_HOME/bin:$JAVA_HOME/jre/bin' ~/.bashrc
fi
if [ ! -n "$classpath" ]; then
sed -i '$a export CLASSPATH=.:$JAVA_HOME/lib:$JAVA_HOME/jre/lib' ~/.bashrc
fi
IFS=$OLDIFS

#!/bin/bash
# Scans ~/TestBash.txt (a stand-in for ~/.bashrc, see the trailing
# comments) for existing JAVA_HOME, CATALINA_HOME, TOMCAT_HOME,
# CATALINA_BASE, JBOSS_HOME, PATH and CLASSPATH settings, then appends the
# missing ones or rewrites the existing *_HOME / *_BASE lines to point at
# the current directory.
# NOTE(review): jbosspath is set both by a line ending in
# $CATALINA_HOME/bin and by one ending in $JBOSS_HOME/bin, and the line
# appended at the end uses $CATALINA_HOME/bin — confirm which is intended.
# Drop the first positional parameter.
shift
# Split the file content on newlines only, one whole line per iteration.
OLDIFS=$IFS
IFS=$'\n'
for line in `cat ~/TestBash.txt` #~/.bashrc
do
  if [[ "$line" =~ .*export.* ]]; then
    if [[ "$line" =~ export\ CLASSPATH=.:\$JAVA_HOME/lib:\$JAVA_HOME/jre/lib$ ]]; then
      classpath=$line
    elif [[ "$line" =~ export\ PATH=\$PATH:\$CATALINA_HOME/bin$ ]]; then
      jbosspath=$line
fi
    # Remember each export whose value looks like an absolute path.
    if [[ "$line" =~ .*JAVA_HOME=.* ]]; then
      if [[ "$line" =~ =(\/([0-9a-zA-Z._]+))+ ]];then
       javahome=$line
      fi
    elif [[ "$line" =~ .*CATALINA_HOME=.* ]];then
      if [[ "$line" =~ =(\/([0-9a-zA-Z._]+))+ ]];then
       catalinahome=$line
      fi
    elif [[ "$line" =~ .*TOMCAT_HOME=.* ]];then
      if [[ "$line" =~ =(\/([0-9a-zA-Z._]+))+ ]];then
       tomcathome=$line
      fi
    elif [[ "$line" =~ .*CATALINA_BASE=.* ]];then
      if [[ "$line" =~ =(\/([0-9a-zA-Z._]+))+ ]];then
       catalinabase=$line
      fi
    elif [[ "$line" =~ .*JBOSS_HOME=.* ]];then
      if [[ "$line" =~ =(\/([0-9a-zA-Z._]+))+ ]];then
       jbosshome=$line
      fi
    fi
  # A PATH line without "export" is accepted here.
  elif [[ "$line" =~ ^PATH=\$PATH:\$JAVA_HOME/bin:\$JAVA_HOME/jre/bin$ ]];then
    javapath=$line
  fi
  if [[ "$line" =~ export\ CLASSPATH=.:\$JAVA_HOME/lib:\$JAVA_HOME/jre/lib$ ]];then
    classpath=$line
  fi
  if [[ "$line" =~ export\ PATH=\$PATH:\$JBOSS_HOME/bin$ ]];then
    jbosspath=$line
  fi
done
# For each setting: append it when it was not found (sed '$a text' appends
# after the last line), otherwise replace the remembered line.
if [ ! -n "$javahome" ]; then
sed -i '$a export JAVA_HOME='$(pwd)'/jdk1.6.0_24' ~/TestBash.txt #~/.bashrc
else
sed -i 's:'${javahome//\\/\\\\}':export JAVA_HOME='$(pwd)'/jdk1.6.0_24:g' ~/TestBash.txt
fi
if [ ! -n "$javapath" ]; then
sed -i '$a PATH=$PATH:$JAVA_HOME/bin:$JAVA_HOME/jre/bin' ~/TestBash.txt #~/.bashrc
fi
if [ ! -n "$classpath" ]; then
sed -i '$a export CLASSPATH=.:$JAVA_HOME/lib:$JAVA_HOME/jre/lib' ~/TestBash.txt #~/.bashrc
fi
if [ ! -n "$catalinahome" ]; then
sed -i '$a export CATALINA_HOME='$(pwd) ~/TestBash.txt #~/.bashrc
else
sed -i 's:'${catalinahome//\\/\\\\}':export CATALINA_HOME='$(pwd)':g' ~/TestBash.txt
fi
if [ ! -n "$tomcathome" ]; then
sed -i '$a export TOMCAT_HOME='$(pwd) ~/TestBash.txt #~/.bashrc
else
sed -i 's:'${tomcathome//\\/\\\\}':export TOMCAT_HOME='$(pwd)':g' ~/TestBash.txt
fi
if [ ! -n "$catalinabase" ]; then
sed -i '$a export CATALINA_BASE='$(pwd) ~/TestBash.txt #~/.bashrc
else
sed -i 's:'${catalinabase//\\/\\\\}':export CATALINA_BASE='$(pwd)':g' ~/TestBash.txt
fi
if [ ! -n "$jbosshome" ]; then
sed -i '$a export JBOSS_HOME='$(pwd) ~/TestBash.txt #~/.bashrc
else
sed -i 's:'${jbosshome//\\/\\\\}':export JBOSS_HOME='$(pwd)':g' ~/TestBash.txt
fi
if [ ! -n "$jbosspath" ]; then
sed -i '$a export PATH=$PATH:$CATALINA_HOME/bin' ~/TestBash.txt #~/.bashrc
fi
IFS=$OLDIFS

53.批量轉換編碼從Unicode到GB2312
#!/bin/bash
# Convert every regular file below the current directory from one
# character encoding to another, in place, keeping mode and ownership.
#
# Fixes over the original:
#  - "for FILE in $(find ...)" split paths on blanks;
#  - the temp file replaced the original even when iconv had failed, which
#    destroyed the file; now a failed conversion leaves it untouched;
#  - a temp file was created (and leaked) for entries that were skipped;
#  - "chown user.group" used the deprecated dot separator.
scode="ucs2"
dcode="gbk"

#######################################
# Convert all regular files at or below ROOT from FROM to TO.
# Arguments: $1 - root directory, $2 - source encoding, $3 - target encoding
# Returns:   non-zero only when a temp file cannot be created
#######################################
convert_tree() {
  local root=$1 from=$2 to=$3
  local path tmp mode owner
  local -a files=()

  # Collect the list first so the temp files created below are never
  # picked up by the traversal.
  while IFS= read -r -d '' path; do
    files+=("$path")
  done < <(find "$root" -type f -print0)

  for path in "${files[@]}"; do
    tmp=$(mktemp -p "$root") || return
    if iconv -f "$from" -t "$to" "$path" > "$tmp"; then
      mode=$(stat -c %a "$path")
      owner=$(stat -c %U:%G "$path")
      mv -f -- "$tmp" "$path"
      chmod "$mode" "$path"
      chown "$owner" "$path"
    else
      rm -f -- "$tmp"
      printf 'skipped (conversion failed): %s\n' "$path" >&2
    fi
  done
}

convert_tree "$(pwd)" "$scode" "$dcode"

54.刪除空資料夾
#!/bin/bash
# Remove the empty directory %%1; with -p each parent directory named in
# the path is removed as well, as long as it is empty too.
# The path is quoted so a name containing blanks stays one argument.
rmdir -p -- "%%1"

55.GB2312檔案轉UTF-8格式
#!/bin/bash
# Convert the file %%1 from GBK to UTF-8 and write the result to %%2.
# Both file names are quoted so paths containing blanks stay single
# arguments.
iconv -f gbk -t utf8 "%%1" -o "%%2"

56.UTF-8檔案轉GB2312格式
#!/bin/bash
# Convert the file %%1 from UTF-8 to GBK and write the result to %%2.
# Both file names are quoted so paths containing blanks stay single
# arguments.
iconv -f utf8 -t gbk "%%1" -o "%%2"

57.獲取檔案路徑的父路徑
#!/bin/bash
# Store the parent directory of the current working directory in
# variable %%1.
# The original "var=basename $PWD" was not a command substitution: it set
# the variable to the word "basename" for one command and then tried to
# execute $PWD.  dirname is used because the snippet asks for the parent
# path; basename would give the last component instead.
%%1=$(dirname -- "$PWD")

58.Unicode檔案轉UTF-8格式
#!/bin/bash
# Convert the file %%1 from UCS-2 to UTF-8 and write the result to %%2.
# Both file names are quoted so paths containing blanks stay single
# arguments.
iconv -f ucs2 -t utf-8 "%%1" -o "%%2"

59.CRC迴圈冗餘校驗
#!/bin/bash
# Write a small CRC-32 program to crc.c, compile it and run it.
# Without arguments the program prints the CRC-32 of "123456789"
# (cbf43926); with an argument it prints the CRC-32 of that string.
cat <<'EOF'> crc.c
#include <stdio.h>
#include <stdint.h>
#include <string.h>

/*
 * The lookup table can be computed beforehand on a PC or, as done here,
 * once at program start-up.
 */
static uint32_t crc32_table[256];

/* CRC-32 generator polynomial (IEEE 802.3), normal representation. */
static const uint32_t ulPolynomial = 0x04c11db7;

/*
 * Reverse the lowest `ch` bits of `ref`: bit 0 swaps with bit ch-1,
 * bit 1 with bit ch-2, and so on.
 */
static uint32_t Reflect(uint32_t ref, char ch)
{
    uint32_t value = 0;
    int i;

    for (i = 1; i < (ch + 1); i++) {
        if (ref & 1)
            value |= (uint32_t)1 << (ch - i);
        ref >>= 1;
    }
    return value;
}

/* Fill crc32_table with the 256 entries of the reflected CRC-32 table. */
static void init_crc32_table(void)
{
    int i, j;

    for (i = 0; i <= 0xFF; i++) {
        uint32_t entry = Reflect((uint32_t)i, 8) << 24;

        for (j = 0; j < 8; j++) {
            /* Remember the bit that is about to be shifted out. */
            uint32_t flag = entry & 0x80000000u;

            entry <<= 1;
            if (flag != 0)
                entry ^= ulPolynomial;
        }
        crc32_table[i] = Reflect(entry, 32);
    }
}

/*
 * Return the CRC-32 of the `len` bytes at `DataBuf`.
 * init_crc32_table() must have been called first.
 * Uses the reflected, table-driven form that matches the reflected table:
 * initial value 0xFFFFFFFF, final XOR 0xFFFFFFFF.
 */
static unsigned long GenerateCRC32(const unsigned char *DataBuf, unsigned long len)
{
    uint32_t crc = 0xFFFFFFFFu;

    while (len--)
        crc = (crc >> 8) ^ crc32_table[(crc ^ *DataBuf++) & 0xFF];

    return (unsigned long)(crc ^ 0xFFFFFFFFu);
}

int main(int argc, char *argv[])
{
    const char *text = (argc > 1) ? argv[1] : "123456789";

    init_crc32_table();
    printf("%08lx\n",
           GenerateCRC32((const unsigned char *)text, (unsigned long)strlen(text)));
    return 0;
}
EOF
# Run the binary that was just built (the output name given to gcc is "crc").
if gcc -o crc crc.c; then
./crc
else
echo 'Compile ERROR'
fi

60.判斷是否為空檔案
#!/bin/bash

61.終止程式
#!/bin/sh
# pidof has to run inside a command substitution so that kill receives a PID;
# -s makes pidof report a single PID.
kill -KILL $(pidof -s "%%1")
#killall %%1

62.定時關機
#!/bin/sh
shutdown -h %%1 & #23:00
#shutdown -h now
#halt
#/sbin/poweroff
#init 0

63.顯示程序列表
#!/bin/sh
ps aux
#fuser -l

64.遍歷資料夾列出檔案大小
#!/bin/sh
# Keep the * outside the quotes so the shell expands it to the directory's
# entries; inside the quotes it would be passed to du literally.
du -sH "%%1"/*

65.GOST演算法
#!/bin/bash

66.對目標壓縮檔案解壓縮到指定資料夾
#!/bin/bash

67.儲存檔案時重名自動生成新檔案
#!/bin/bash

68.開啟網頁
#!/bin/sh
lynx %%1

69.刪除空資料夾整合操作
#!/bin/bash

70.獲取磁碟所有分割槽
#!/bin/sh
df -k

71.啟用一個程式或程式關聯的檔案
#!/bin/bash

72.MP3播放
#!/bin/sh
amp "%%1"

73.WAV播放
#!/bin/sh
amp "%%1"

74.寫影象到剪下板
#!/bin/bash

75.從剪貼簿複製影象到窗體
#!/bin/bash

76.刪除資料夾下的所有檔案且不刪除資料夾下的資料夾
#!/bin/sh
# Remove every non-directory entry directly inside the folder and leave the
# sub-folders alone. (A quoted "dir/*" is never expanded by the shell, so rm
# would only look for a file literally named "*".)
find "%%1" -maxdepth 1 ! -type d -exec rm -f -- {} +

77.XML遍歷結點屬性值
#!/bin/bash

78.Unicode檔案轉GB2312格式
#!/bin/sh
iconv -f ucs2 -t  gbk %%1 -o %%2

79.開源程式庫Xercesc-C++程式碼工程中內聯

80.提取包含標頭檔案列表
#!/bin/bash

81.GB2312檔案轉Unicode格式
#!/bin/sh
iconv -f gbk -t  ucs2 %%1 -o %%2

82.Java程式打包
#!/bin/bash

83.UTF-8檔案轉Unicode格式
#!/bin/bash
iconv -f utf8 -t  ucs2 %%1 -o %%2

84.建立PDF文件
#!/bin/bash

85.建立Word文件
#!/bin/bash

86.快速高效的檔案加密
#!/bin/bash

87.從CSV檔案構造XML文件
#!/bin/bash

88.從XML文件生成CSV檔案
#!/bin/bash

89.模擬鍵盤輸入字串
#!/bin/bash

90.提取PDF檔案中的文字
#!/bin/bash

91.操作記憶體對映檔案
#!/bin/bash
91.1傳送記憶體對映資料
#!/bin/bash

91.2接收記憶體對映資料
#!/bin/bash

92.重定向windows控制檯程式的輸出資訊
#!/bin/bash

93.基數轉序數
#!/bin/bash

94.數字月份轉英文
#!/bin/bash

95.報表相關
#!/bin/bash

96.根據程序名獲取程序ID
#!/bin/bash
pidof %%1 -s

96.BCP匯入
#!/bin/bash

97.BCP匯出
#!/bin/bash


98.計算檔案MD5值
#!/bin/bash
md5sum "%%1"

99.計算獲取資料夾中檔案的MD5值
#!/bin/bash

100.複製一個目錄下所有檔案到一個資料夾中
#!/bin/bash
# -type f selects the regular files at any depth; -exec ... {} + hands the
# names to cp intact, so whitespace in file names is safe.
# cp -t (target directory first) is a GNU coreutils option.
find "%%1" -type f -exec cp -t "%%2" -- {} +

101.移動一個目錄下所有檔案到一個資料夾中
#!/bin/bash
# -type f selects the regular files at any depth; -exec ... {} + hands the
# names to mv intact, so whitespace in file names is safe.
# mv -t (target directory first) is a GNU coreutils option.
find "%%1" -type f -exec mv -t "%%2" -- {} +

102.檔案RSA高階加密
十進位制到十六進位制
typeset -i16 BASE_16_NUM
BASE_16_NUM=%%1
echo $BASE_16_NUM

八進位制到十六進位制
#!/bin/bash
# bash's typeset -i does not accept a base (typeset -i16 is ksh syntax).
# 8#N makes arithmetic expansion read N as octal; printf %x prints it in hex.
printf '%x\n' "$((8#%%1))"

十進位制到八進位制
#!/bin/bash
printf %o %%1; echo

十進位制到十六進位制
#!/bin/bash
printf %x %%1; echo

103.計算檔案大小
#!/bin/bash
# -c limits wc to the byte count; reading from stdin keeps the file name out
# of the output so only the size is printed.
wc -c < "%%1"

104.計算資料夾的大小
#!/sbin/ksh
# Print the directory tree below $dir with the size of each directory in KB.
dir=%%1
(cd "$dir" && pwd)
# du walks the tree itself and does not read stdin, so it is given $dir
# directly; -k makes it report kilobytes.
# The first sed expression turns the last path component into "|--name"
# (\( \) captures it, \1 re-inserts it); the second replaces every remaining
# leading component with "| " to draw the indentation.
du -k "$dir" | awk '{print $2, "== ("$1"kb)"}' | sort -f |
sed -e "s,[^ /]*/\([^ /]*\) ==,|--\1," -e "s,[^ /]*/,| ,g"

105.快速獲得當前程式的驅動器、路徑、檔名和副檔名

106.磁碟剩餘空間計算
#!/bin/bash
df -k

107.獲取當前程式程序ID
#!/bin/bash
pidof %%1 -s

108.全盤搜尋檔案
#!/bin/bash
#updatedb
#locate %%1
slocate %%1

109.獲得當前登入的使用者名稱
#!/bin/bash
whoami

110.獲得所有使用者名稱
#!/bin/bash
who

111.建立MySQL管理使用者
#!/bin/bash
mysqladmin -u root password %%1

112.管理MySQL資料庫伺服器
#!/bin/bash
112.1.啟動MySQL資料庫伺服器
mysqld -console

112.2.登入MySQL資料庫伺服器
112.2.1.登入本地MySQL資料庫伺服器
mysql -uroot -p%%1

112.2.2.登入遠端MySQL資料庫伺服器
mysql -h %%1 -u %%2 -p%%3

112.3.關閉MySQL資料庫伺服器
mysqladmin -u root shutdown
#pkill -9 mysql

112.4.測試MySQL資料庫伺服器
mysqlshow || mysqlshow -u root mysql || mysqladmin version status || mysql test

113.MySQL執行查詢
#!/bin/sh
# Statements are executed with the mysql client (mysqladmin only performs
# administrative operations). The statement is passed as one quoted -e
# argument so the shell does not expand the * or split at the ;.
mysql -u %%1 -p%%2 -e "SELECT * INTO OUTFILE './bestlovesky.xls' FROM bestlovesky WHERE 1 ORDER BY id DESC  LIMIT 0, 50;"

114.建立Oracle管理使用者
#!/bin/sh
114.1.建立新使用者
create user test identified by test default tablespace ts_test temporary
tablespace temp;

114.2.給使用者角色特權
grant connect,resource to test;

115.登入Oracle資料庫
#!/bin/bash
sqlplusw
sqlplus /nolog
conn username/password@service_name

conn system/password@service_name
conn sys/password@service_name as sysdba

115.建立Oracle表空間
#!/bin/bash
conn username/password@service_name
create tablespace ts_test datafile '/data2/oradata/ciis/ts_test01.dbf' size

116.新增Oracle資料檔案
#!/bin/bash
alter tablespace ts_test add datafile '/data2/oradata/ciis/ts_test02.dbf' size

117.檢視Oracle表空間大小
#!/bin/bash
desc DBA_DATA_FILES

118.檢視Oracle剩餘表空間大小
#!/bin/bash
desc DBA_FREE_SPACE

119.檢視Oracle當前使用者表名
#!/bin/bash
select * from tab;

120.Oracle建立索引
#!/bin/bash
CREATE INDEX idx_book_bookid ON book(bookname);

121.Oracle建立主鍵約束
#!/bin/bash
ALTER TABLE book ADD CONSTRAINT pk_book_bookid PRIMARY KEY (bookid);

122.Oracle顯示錶結構
#!/bin/bash
desc book

123.Oracle查看錶的索引
#!/bin/bash
column index_name format a30
select table_name, index_name from user_indexes;

124.Oracle檢視索引列
#!/bin/bash
select table_name, index_name, column_name, column_position from user_ind_columns;

125.Oracle檢視資料段佔空間大小
#!/bin/bash
desc user_segments

126.Oracle查看錶佔空間大小
#!/bin/bash
select segment_name,segment_type,bytes from user_segments where segment_type='TABLE';

127.安全刪除USB
#!/bin/bash
rundll32.exe shell32.dll,Control_RunDLL hotplug.dll

128.開啟SQL Server Management Studio
#!/bin/bash
sqlwb %%1.sql

129.MySQL資料庫匯出備份
#!/bin/bash
# The password must follow -p without a space; with a space the client
# prompts for a password and treats the next word as a database name.
mysqldump -u %%1 -p%%2 %%3 > %%4.sql
# Export database "test" to the text file mysql.test.
mysqldump --opt test > mysql.test
# Export database "dbname" to the file mysql.dbname.
mysqldump -u root -p123456 --databases dbname > mysql.dbname

130.MySQL資料庫資料匯入
# The password must follow -p without a space.
mysql -u %%1 -p%%2 %%3 < %%4.sql
# An SQL dump is replayed with the mysql client; mysqlimport loads delimited
# text files named on its command line and does not read a dump from stdin.
mysql -u root -p123456 < mysql.dbname
將文字資料匯入資料庫:
文字資料的欄位之間用tab鍵隔開
use test
load data local infile "檔名" into table 表名;
eg: load data local infile "D:/mysql.txt" into table mytable;
匯入.sql 檔案命令
use database
source d:/mysql.sql;

131.MySQL資料庫檢查
# The password must follow -p without a space; otherwise the client prompts
# and treats the next word as a database name.
mysqlcheck -o %%3 -u %%1 -p%%2

132.MySQL資料表文件修復
myisamchk -B -o %%1.myd

1,檢視資料庫狀態 及啟動停止
/etc/init.d/mysqld status
/etc/init.d/mysqld start
/etc/init.d/mysqld stop

2,給使用者配置初始密碼123456:
# "password" is a mysqladmin sub-command, not an option: written as
# "-password" it would be parsed as -p with the password "assword".
mysqladmin -u root password 123456

3,修改root使用者密碼為 abc123
mysqladmin -u root -p123456 password abc123

4,如果想去掉密碼:
mysqladmin -u root -pabc123 password ""

5,root連線資料庫有密碼和無密碼:
mysql -u root(-uroot) -p
mysql

6,增加使用者 test1 密碼 abc,讓它可以在任何主機上登入,並對所有資料庫有查詢,插入,修改,刪除的許可權:
格式: grant select on 資料庫.* to 使用者名稱@登入主機 identified by "密碼"
grant select,insert,update,delete on *.* to test1@"%" identified by "abc";

8,增加一個使用者test2,讓它只可以在localhost上登入,並可以對資料庫mydb進行查詢,插入,修改,刪除的操作,
這樣使用者即使使用知道test2的密碼,他也無法從internet 上直接訪問資料庫,只能通過mysql主機上的web頁面來訪問。
grant select,insert,update,delete on mydb.* to test2@localhost identified by "abc";
grant select,insert,update,delete on mydb.* to test2@localhost identified by ""; 設定無密碼

9,顯示資料庫列表:
show databases;
use mysql 開啟庫
show tables;

10,表的操作
describe 表名; 顯示資料表的結構
create database 庫名;
drop database 庫名;
create table 表名(欄位設定列表)
drop table 表名;
delete from 表名;清空表記錄
select * from 表名; 顯示錶中的記錄
insert into 表名 values(, ,)

alter table 表名 add column <欄位名><欄位選項>

133.檢查端口占用
#!/bin/bash
netstat -ano

134.Linux下檢查Apache是否安裝
#!/bin/bash
rpm -qa | grep httpd

135.Linux下啟動Apache服務
#!/bin/bash
service httpd start

136.Linux下停止Apache服務
#!/bin/bash
service httpd stop

137.Linux下重新啟動Apache服務
#!/bin/bash
service httpd restart

138.Linux下自動載入Apache 服務
#!/bin/bash
# --level is a single long option; "- level" would be read as two operands.
chkconfig --level 3 httpd on

139.Linux下不自動載入Apache 服務
#!/bin/bash
# --level is a single long option; "- level" would be read as two operands.
chkconfig --level 3 httpd off

140.Linux下檢查VSFTP是否安裝
#!/bin/bash
rpm -qa | grep vsftpd

141.Linux下啟動VSFTP服務
#!/bin/bash
service vsftpd start

142.Linux下停止VSFTP服務
#!/bin/bash
service vsftpd stop

143.Linux下重新啟動VSFTP服務
#!/bin/bash
service vsftpd restart

144.Linux下檢查VSFTP是否被啟動
#!/bin/bash
pstree | grep vsftpd

145.Linux下檢查Sendmail是否安裝
#!/bin/bash
rpm -qa | grep sendmail

146.Linux下啟動Sendmail服務
#!/bin/bash
service sendmail start

147.Linux下停止Sendmail服務
#!/bin/bash
# The service is named "sendmail", as in the start/restart snippets.
service sendmail stop

148.Linux下重新啟動Sendmail服務
#!/bin/bash
service sendmail restart

149.Linux下自動載入Sendmail 服務
#!/bin/bash
# --level is a single long option; "- level" would be read as two operands.
chkconfig --level 3 sendmail on

150.Linux下不自動載入Sendmail 服務
#!/bin/bash
# --level is a single long option; "- level" would be read as two operands.
chkconfig --level 3 sendmail off

151.Linux下文字圖形介面配置啟動服務
#!/bin/bash
ntsysv

152.以陣列的方式刪除資料夾

153.GCC批量編譯
#!/bin/bash
# Compile every C and C++ source file below the current directory into an
# executable placed next to it and named after the source without extension.
find . -type f \( -iname '*.c' -o -iname '*.cpp' \) -print |
while IFS= read -r filename
do
    case "$filename" in
    *.c)
        gcc "$filename" -o "${filename%.c}"
        ;;
    *.cpp)
        # g++ links the C++ standard library; the gcc driver does not.
        g++ "$filename" -o "${filename%.cpp}"
        ;;
    esac
done

154.批量賦予可執行許可權
#!/bin/bash
# Mark scripts and installers below the current directory as executable.
# -exec ... {} + batches the names like xargs does, but does not run chmod
# at all when nothing matches.
find "$PWD" -type f \( -iname '*.sh' -o  -iname '*.csh' -o  -iname '*.ksh' -o -iname '*.pl' -o -iname '*.bin' -o -iname '*.run' -o -iname '*.bundle' -o -iname '*.rb' -o -iname '*.py' \) -exec chmod +x -- {} +

#!/bin/bash
# Mark scripts and installers in the current directory and in every
# directory below it as executable.

# Part 1: files directly in the current directory.
for file in *.sh *.pl *.bin *.run *.bundle *.rb *.py
do
# A glob that matches nothing stays as the literal pattern; -f skips it.
if [ -f "$file" ]; then
chmod +x "$file"
fi
done

# Part 2: every directory below the current one. The directory names are read
# NUL-delimited so that names with spaces or colons survive.
while IFS= read -r -d '' path
do
for file in "$path"/*.sh "$path"/*.pl "$path"/*.bin "$path"/*.run "$path"/*.bundle "$path"/*.rb "$path"/*.py
do
# $file already carries the directory prefix, so it is used as is.
if [ -f "$file" ]; then
chmod +x "$file"
fi
done
done < <(find "$(pwd)" -type d -print0)

155.批量執行
#!/bin/bash
# Run every script, installer, Java class/archive and RPM package found
# below the current directory, each inside an xterm.
find . -type f \( -iname '*.sh' -o  -iname '*.csh' -o  -iname '*.ksh' -o -iname '*.pl' -o -iname '*.bin' -o -iname '*.run' -o -iname '*.bundle' -o -iname '*.class' -o -iname '*.rpm' -o -iname '*.rb' -o -iname '*.py' -o -iname '*.jar' \) -print |
while IFS= read -r filename
do
    case "$filename" in
    *.sh | *.csh | *.ksh)
        # Do not let this script launch itself (matches an invocation of the
        # form ./name).
        if [ "./$(basename "$filename")" != "$0" ]; then
            xterm -e "$filename"
        fi
        ;;
    *.pl)
        xterm -e perl "$filename"
        ;;
    *.bin | *.run | *.bundle)
        xterm -e "$filename"
        ;;
    *.class)
        # java expects a class name plus a class path, not a file path.
        # NOTE(review): assumes the class is in the default package - confirm.
        xterm -e java -cp "$(dirname "$filename")" "$(basename "$filename" .class)"
        ;;
    *.rpm)
        xterm -e rpm -ivh "$filename"
        ;;
    *.rb)
        xterm -e ruby "$filename"
        ;;
    *.py)
        xterm -e python "$filename"
        ;;
    *.jar)
        xterm -e java -jar "$filename"
        ;;
    esac
done

#!/bin/bash
find -maxdepth 1 -t