sql_loader使用指南

sql_Loader

 


需要寫控制文件,程序根據控制文件從數據文件中讀數據寫入到數據庫中
條件:
一個數據庫、一個需要裝載的展開文件、一個描述展開文件的控制文件。可以生成壞文件bad(引起錯誤的記錄被寫入)、discard丟失文件(不能選擇標準的記錄被寫入)、log日誌文件
direct=true
直接裝入
裝載方式:
        INSERT
:指定要裝載一個空表
        APPEND
:添加方式
        REPLACE
:替代方式,如果數據存在,則刪除
        TRUNCATE
:先清空表
常規導入先生成常規的SQL語句,再執行該語句,使用數組接口。
直接路局導入:先形成數據塊,直接寫入塊,速度非常快,但受到許多約束

[目錄]



導入csv文件到數據庫


1.
庫結構
SQL> desc testLoad
Name                                      Null?    Type
----------------------------------------- -------- ----------------------------
F1                                        NOT NULL NUMBER
F2                                                 VARCHAR2(30)
F3                                                 DATE

2.控制文件testLoad.ctl

LOAD DATA
        INFILE 'testLoad.csv'
        BADFILE 'testLoad'                -- 無法插入的記錄被放入該文件中
        APPEND
        INTO TABLE testLoad
        TRAILING NULLCOLS
        (
                F1        INTEGER EXTERNAL TERMINATED BY ",",
                F2        CHAR TERMINATED BY ",",
                F3        DATE "RRRR-MM-DD" TERMINATED BY ","
        )

3.數據庫文件testLoad.csv
1,one row,1901-01-01
2,two row,1902-01-01
3,three row,1903-01-01
4,four row,1904-01-01
5,five row,1905-01-01
6,six row,1906-01-01
7,serven row,1907-01-01
8,eight row,1908-01-01
9,nine row,1909-01-01
10,ten row

導入固定格式的文件
1.
庫結構
SQL> desc testLoad
Name                                      Null?    Type
----------------------------------------- -------- ----------------------------
F1                                        NOT NULL NUMBER
F2                                                 VARCHAR2(30)
F3                                                 DATE

2.控制文件testLoad.ctl

LOAD DATA
        INFILE 'testLoad.csv'
        BADFILE 'testLoad'                -- 無法插入的記錄被放入該文件中
        APPEND
        INTO TABLE testLoad
        TRAILING NULLCOLS
        (
                F1        POSITION(1:0) INTEGER EXTERNAL,
                F2        POSITION(2:12) CHAR "upper(:f2)",        -- 可以使用oracle的函數,但不能使用僞列
                F3        POSITION(13:22) DATE "RRRR-MM-DD"
        )

3.數據庫文件testLoad
1one row    1901-01-01
2two row    1902-01-01
3three row  1903-01-01
4four row   1904-01-01
5five row   1905-01-01
6six row    1906-01-01
7serven row 1907-01-01
8eight row  1908-01-01
9nine row   1909-01-01

導入大量文本


1.
庫結構
SQL> desc testLoad
Name                                      Null?    Type
----------------------------------------- -------- ----------------------------
F1                                        NOT NULL NUMBER
F2                                                 VARCHAR2(30)
F3                                                 DATE
F4                                                   CLOB

2.控制文件testLoad.ctl

LOAD DATA
        INFILE 'testLoad.csv'
        BADFILE 'testLoad'                -- 無法插入的記錄被放入該文件中
        APPEND
        INTO TABLE testLoad
        TRAILING NULLCOLS
        (
                F1        INTEGER EXTERNAL TERMINATED BY ",",
                F2        CHAR TERMINATED BY ",",
                F3        DATE "RRRR-MM-DD" TERMINATED BY ",",
                F4_file_name FILLER CHAR TERMINATED BY ",",
                F4        LOBFILE(F4_file_name)
                        TERMINATED BY EOF
        )

3.數據庫文件testLoad.csv
1,one row,1901-01-01,note1.txt
2,two row,1902-01-01,note2.txt
3,three row,1903-01-01,note3.txt
4,four row,1904-01-01,note4.txt
5,five row,1905-01-01,note5.txt
6,six row,1906-01-01,note6.txt
7,serven row,1907-01-01,note7.txt
8,eight row,1908-01-01,note8.txt
9,nine row,1909-01-01,note9.txt

執行語句:

sqlldr userid=zhuanxian/zx control=input1.ctl

***** 指定不裝載那一列
LOAD DATA
INFILE *
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'
( DEPTNO,
FILLER_1 FILLER, //
下面的 "Something Not To Be Loaded" 將不會被裝載
DNAME,
LOC
)
BEGINDATA
20,Something Not To Be Loaded,Accounting,"Virginia,USA"

sql load的一點小總結

以下是本人對sql load 的一些運用總結 不足之處還多包涵

sqlldr userid=lgone/tiger control=a.ctl
LOAD DATA
INFILE 't.dat' //
要導入的文件
// INFILE 'tt.date' //
導入多個文件
// INFILE * //
要導入的內容就在control文件裏 下面的BEGINDATA後面就是導入的內容

INTO TABLE table_name //
指定裝入的表
BADFILE 'c:bad.txt' //
指定壞文件地址

*************
以下是4種裝入表的方式
APPEND //
原先的表有數據 就加在後面
// INSERT //
裝載空表 如果原先的表有數據 sqlloader會停止 默認值
// REPLACE //
原先的表有數據 原先的數據會全部刪除
// TRUNCATE //
指定的內容和replace的相同 會用truncate語句刪除現存數據

*************
指定的TERMINATED可以在表的開頭 也可在表的內部字段部分
FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'
//
裝載這種數據: 10,lg,"""lg""","lg,lg"
//
在表中結果: 10 lg "lg" lg,lg
// TERMINATED BY X '09' //
以十六進制格式 '09' 表示的
// TERMINATED BY WRITESPACE //
裝載這種數據: 10 lg lg

TRAILING NULLCOLS *************
表的字段沒有對應的值時允許爲空

*************
下面是表的字段
(
col_1 , col_2 ,col_filler FILLER // FILLER
關鍵字 此列的數值不會被裝載
//
: lg,lg,not 結果 lg lg
)
//
當沒聲明FIELDS TERMINATED BY ','
// (
// col_1 [interger external] TERMINATED BY ',' ,
// col_2 [date "dd-mon-yyy"] TERMINATED BY ',' ,
// col_3 [char] TERMINATED BY ',' OPTIONALLY ENCLOSED BY 'lg'
// )
//
當沒聲明FIELDS TERMINATED BY ','用位置告訴字段裝載數據
// (
// col_1 position(1:2),
// col_2 position(3:10),
// col_3 position(*:16), //
這個字段的開始位置在前一字段的結束位置
// col_4 position(1:16),
// col_5 position(3:10) char(8) //
指定字段的類型
// )

BEGINDATA //
對應開始的 INFILE * 要導入的內容就在control文件裏
10,Sql,what
20,lg,show

=====================================================================================
////////////
注意begindata後的數值前面不能有空格

1 *****
普通裝載
LOAD DATA
INFILE *
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'
(DEPTNO,
DNAME,
LOC
)
BEGINDATA
10,Sales,"""USA"""
20,Accounting,"Virginia,USA"
30,Consulting,Virginia
40,Finance,Virginia
50,"Finance","",Virginia // loc
列將爲空
60,"Finance",,Virginia // loc
列將爲空

2 ***** FIELDS TERMINATED BY WHITESPACE
FIELDS TERMINATED BY x'09' 的情況
LOAD DATA
INFILE *
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY WHITESPACE
-- FIELDS TERMINATED BY x'09'
(DEPTNO,
DNAME,
LOC
)
BEGINDATA
10 Sales Virginia

3 *****
指定不裝載那一列
LOAD DATA
INFILE *
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'
( DEPTNO,
FILLER_1 FILLER, //
下面的 "Something Not To Be Loaded" 將不會被裝載
DNAME,
LOC
)
BEGINDATA
20,Something Not To Be Loaded,Accounting,"Virginia,USA"

4 ***** position
的列子
LOAD DATA
INFILE *
INTO TABLE DEPT
REPLACE
( DEPTNO position(1:2),
DNAME position(*:16), //
這個字段的開始位置在前一字段的結束位置
LOC position(*:29),
ENTIRE_LINE position(1:29)
)
BEGINDATA
10Accounting Virginia,USA

5 *****
使用函數 日期的一種表達 TRAILING NULLCOLS的使用
LOAD DATA
INFILE *
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY ','
TRAILING NULLCOLS //
其實下面的ENTIRE_LINEBEGINDATA後面的數據中是沒有直接對應
//
的列的值的 如果第一行改爲 10,Sales,Virginia,1/5/2000,, 就不用TRAILING NULLCOLS
(DEPTNO,
DNAME "upper(:dname)", //
使用函數
LOC "upper(:loc)",
LAST_UPDATED date 'dd/mm/yyyy', //
日期的一種表達方式 還有'dd-mon-yyyy'
ENTIRE_LINE ":deptno||:dname||:loc||:last_updated"
)
BEGINDATA
10,Sales,Virginia,1/5/2000
20,Accounting,Virginia,21/6/1999
30,Consulting,Virginia,5/1/2000
40,Finance,Virginia,15/3/2001

6 *****
使用自定義的函數 // 解決的時間問題
create or replace
function my_to_date( p_string in varchar2 ) return date
as
type fmtArray is table of varchar2(25);

l_fmts fmtArray := fmtArray( 'dd-mon-yyyy', 'dd-month-yyyy',
'dd/mm/yyyy',
'dd/mm/yyyy hh24:mi:ss' );
l_return date;
begin
for i in 1 .. l_fmts.count
loop
begin
l_return := to_date( p_string, l_fmts(i) );
exception
when others then null;
end;
EXIT when l_return is not null;
end loop;

if ( l_return is null )
then
l_return :=
new_time( to_date('01011970','ddmmyyyy') + 1/24/60/60 *
p_string, 'GMT', 'EST' );
end if;

return l_return;
end;
/

LOAD DATA
INFILE *
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY ','
TRAILING NULLCOLS
(DEPTNO,
DNAME "upper(:dname)",
LOC "upper(:loc)",
LAST_UPDATED "my_to_date( :last_updated )" //
使用自定義的函數
)
BEGINDATA
10,Sales,Virginia,01-april-2001
20,Accounting,Virginia,13/04/2001
30,Consulting,Virginia,14/04/2001 12:02:02
40,Finance,Virginia,987268297
50,Finance,Virginia,02-apr-2001
60,Finance,Virginia,Not a date

7 *****
合併多行記錄爲一行記錄
LOAD DATA
INFILE *
concatenate 3 //
通過關鍵字concatenate 把幾行的記錄看成一行記錄
INTO TABLE DEPT
replace
FIELDS TERMINATED BY ','
(DEPTNO,
DNAME "upper(:dname)",
LOC "upper(:loc)",
LAST_UPDATED date 'dd/mm/yyyy'
)
BEGINDATA
10,Sales, //
其實這3行看成一行 10,Sales,Virginia,1/5/2000
Virginia,
1/5/2000
//
這列子用 continueif list="," 也可以
告訴sqlldr在每行的末尾找逗號 找到逗號就把下一行附加到上一行

LOAD DATA
INFILE *
continueif this(1:1) = '-' //
找每行的開始是否有連接字符 - 有就把下一行連接爲一行
//
-10,Sales,Virginia,
// 1/5/2000
就是一行 10,Sales,Virginia,1/5/2000
//
其中1:1 表示從第一行開始 並在第一行結束 還有continueif next continueif list最理想
INTO TABLE DEPT
replace
FIELDS TERMINATED BY ','
(DEPTNO,
DNAME "upper(:dname)",
LOC "upper(:loc)",
LAST_UPDATED date 'dd/mm/yyyy'
)
BEGINDATA //
但是好象不能象右面的那樣使用
-10,Sales,Virginia, -10,Sales,Virginia,
1/5/2000 1/5/2000
-40, 40,Finance,Virginia,13/04/2001
Finance,Virginia,13/04/2001

8 ***** 載入每行的行號

load data
infile *
into table t
replace
( seqno RECNUM //
載入每行的行號
text Position(1:1024))
BEGINDATA
fsdfasj //
自動分配一行號給載入 t seqno字段 此行爲 1
fasdjfasdfl //
此行爲 2 ...

9 *****
載入有換行符的數據
注意: unix windows 不同 & /n
< 1 >
使用一個非換行符的字符
LOAD DATA
INFILE *
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY ','
TRAILING NULLCOLS
(DEPTNO,
DNAME "upper(:dname)",
LOC "upper(:loc)",
LAST_UPDATED "my_to_date( :last_updated )",
COMMENTS "replace(:comments,'n',chr(10))" // replace
的使用幫助轉換換行符
)
BEGINDATA
10,Sales,Virginia,01-april-2001,This is the SalesnOffice in Virginia
20,Accounting,Virginia,13/04/2001,This is the AccountingnOffice in Virginia
30,Consulting,Virginia,14/04/2001 12:02:02,This is the ConsultingnOffice in Virginia
40,Finance,Virginia,987268297,This is the FinancenOffice in Virginia

< 2 >
使用fix屬性
LOAD DATA
INFILE demo17.dat "fix 101"
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY ','
TRAILING NULLCOLS
(DEPTNO,
DNAME "upper(:dname)",
LOC "upper(:loc)",
LAST_UPDATED "my_to_date( :last_updated )",
COMMENTS
)
demo17.dat
10,Sales,Virginia,01-april-2001,This is the Sales
Office in Virginia
20,Accounting,Virginia,13/04/2001,This is the Accounting
Office in Virginia
30,Consulting,Virginia,14/04/2001 12:02:02,This is the Consulting
Office in Virginia
40,Finance,Virginia,987268297,This is the Finance
Office in Virginia

//
這樣裝載會把換行符裝入數據庫 下面的方法就不會 但要求數據的格式不同

LOAD DATA
INFILE demo18.dat "fix 101"
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY ',' OPTIONALLY ENCLOSED BY '"'
TRAILING NULLCOLS
(DEPTNO,
DNAME "upper(:dname)",
LOC "upper(:loc)",
LAST_UPDATED "my_to_date( :last_updated )",
COMMENTS
)
demo18.dat
10,Sales,Virginia,01-april-2001,"This is the Sales
Office in Virginia"
20,Accounting,Virginia,13/04/2001,"This is the Accounting
Office in Virginia"
30,Consulting,Virginia,14/04/2001 12:02:02,"This is the Consulting
Office in Virginia"
40,Finance,Virginia,987268297,"This is the Finance
Office in Virginia"

< 3 >
使用var屬性
LOAD DATA
INFILE demo19.dat "var 3"
// 3
告訴每個記錄的前3個字節表示記錄的長度 如第一個記錄的 071 表示此記錄有 71 個字節
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY ','
TRAILING NULLCOLS
(DEPTNO,
DNAME "upper(:dname)",
LOC "upper(:loc)",
LAST_UPDATED "my_to_date( :last_updated )",
COMMENTS
)
demo19.dat
07110,Sales,Virginia,01-april-2001,This is the Sales
Office in Virginia
07820,Accounting,Virginia,13/04/2001,This is the Accounting
Office in Virginia
08730,Consulting,Virginia,14/04/2001 12:02:02,This is the Consulting
Office in Virginia
07140,Finance,Virginia,987268297,This is the Finance
Office in Virginia

< 4 >
使用str屬性
//
最靈活的一中 可定義一個新的行結尾符 win 回車換行 : chr(13)||chr(10)

此列中記錄是以 a|rn 結束的
select utl_raw.cast_to_raw('|'||chr(13)||chr(10)) from dual;
結果 7C0D0A

LOAD DATA
INFILE demo20.dat "str X'7C0D0A'"
INTO TABLE DEPT
REPLACE
FIELDS TERMINATED BY ','
TRAILING NULLCOLS
(DEPTNO,
DNAME "upper(:dname)",
LOC "upper(:loc)",
LAST_UPDATED "my_to_date( :last_updated )",
COMMENTS
)
demo20.dat
10,Sales,Virginia,01-april-2001,This is the Sales
Office in Virginia|
20,Accounting,Virginia,13/04/2001,This is the Accounting
Office in Virginia|
30,Consulting,Virginia,14/04/2001 12:02:02,This is the Consulting
Office in Virginia|
40,Finance,Virginia,987268297,This is the Finance
Office in Virginia|





==============================================================================
象這樣的數據 nullif 子句

10-jan-200002350Flipper seemed unusually hungry today.
10510-jan-200009945Spread over three meals.

id position(1:3) nullif id=blanks //
這裏可以是blanks 或者別的表達式
//
下面是另一個列子 第一行的 1 在數據庫中將成爲 null
LOAD DATA
INFILE *
INTO TABLE T
REPLACE
(n position(1:2) integer external nullif n='1',
v position(3:8)
)
BEGINDATA
1 10
20lg
------------------------------------------------------------

如果是英文的日誌 格式,可能需要修改環境變量 nls_lang or nls_date_format

發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
相關文章