EricJoy2048 opened a new issue, #5841:
URL: https://github.com/apache/seatunnel/issues/5841

   ### Search before asking
   
   - [X] I had searched in the 
[issues](https://github.com/apache/seatunnel/issues?q=is%3Aissue+label%3A%22bug%22)
 and found no similar issues.
   
   
   ### What happened
   
   I tested using `\n\n` as the row delimiter to write data to a file and then 
read the data back from that file. Writing works fine, but when reading, the 
source treats the blank lines as data content.
   
   
   
![image](https://github.com/apache/seatunnel/assets/32193458/c4dc815b-842d-429b-8f64-6f6008d4ceaf)
   
   
   ### SeaTunnel Version
   
   all
   
   ### SeaTunnel Config
   
   ```conf
   First, write the data to a file.
   
   env {
   "job.mode"=BATCH
   "job.name"="v26_virtu_batch_mysql_to_localfile_lzo"
   }
   source {
   Jdbc {
       "split.inverse-sampling.rate"=1000
       parallelism=1
       "result_table_name"=Table11539883745824
       query="SELECT `id`, `smallint_col`, `integer_col`, `bigint_col`, 
`decimal_col`, `numeric_col`, `real_col`, `double_col`, `bigserial_col`, 
`varchar_col`, `date_col`, `timestamp_col` FROM 
`qa_source`.`v26_virtu_batch_mysql_to_localfile_lzo`"
       "table_path"="qa_source.v26_virtu_batch_mysql_to_localfile_lzo"
       password="BRmk34HkyUvE/Um0Qpmg=="
       driver="com.mysql.cj.jdbc.Driver"
       "xa_data_source_class_name"="com.mysql.cj.jdbc.MysqlXADataSource"
       
url="jdbc:mysql://datasource01:3306/offline_where?rewriteBatchedStatements=true"
       user="QCcLGiNruBrrawgM3EeQDQ=="
   }
   }
   transform {
   }
   sink {
   LocalFile {
       "is_enable_transaction"="true"
       "source_table_name"=Table11539883745824
       path="/data/file_lzo/"
       "file_format_type"=TEXT
       "date_format"=yyyy-MM-dd
       "field_delimiter"=","
       "row_delimiter"="\n\n"
       "enable_header_write"="true"
       "sink_columns"=[]
       "compress_codec"=LZO
   }
   }
   ```
   
   This job writes the data to a file using `\n\n` as the row delimiter. The 
resulting file looks like this:
   
   ```
   1,1,3,4,5
   
   tk,6j,3,4,5
   
   6,7,7,7,7
   ```
   
   Second, read this file.
   
   ```
   env {
   "job.mode"=BATCH
   "job.name"="v26_localfile_lzo_to_ftpfile"
   }
   source {
   LocalFile {
       parallelism=1
       "result_table_name"=Table11574403569696
       schema {
           table="local_file_lzo_001"
           "schema_first"=false
           comment=null
           columns=[
               {
                   "nullable"=true
                   name=id
                   type=int
               },
               {
                   "nullable"=false
                   name="smallint_col"
                   type=smallint
               },
               {
                   "nullable"=false
                   name="integer_col"
                   type=int
               },
               {
                   "nullable"=false
                   name="bigint_col"
                   type=bigint
               },
               {
                   "nullable"=false
                   name="decimal_col"
                   type="decimal(38, 18)"
               },
               {
                   "nullable"=false
                   name="numeric_col"
                   type="decimal(38, 18)"
               },
               {
                   "nullable"=false
                   name="real_col"
                   type=float
               },
               {
                   "nullable"=false
                   name="double_col"
                   type=double
               },
               {
                   "nullable"=false
                   name="bigserial_col"
                   type=int
               },
               {
                   columnLength=255
                   "nullable"=false
                   name="varchar_col"
                   type=string
               },
               {
                   "nullable"=false
                   name="date_col"
                   type=date
               },
               {
                   "nullable"=false
                   name="timestamp_col"
                   type=timestamp
               }
           ]
       }
       path="/data/file_lzo/"
       "file_format_type"=TEXT
       "field_delimiter"=","
       "row_delimiter"="\n\n"
       "skip_header_row_number"="1"
       "compress_codec"=LZO
   }
   }
   transform {
   }
   sink {
   FtpFile {
       "tmp_path"="/data/vsftp_path/tmp/"
       "source_table_name"=Table11574403569696
       path="/data/vsftp_path/"
       "file_format_type"=TEXT
       "field_delimiter"=","
       "row_delimiter"="\n\n"
       "enable_header_write"="true"
       "compress_codec"=NONE
       password="IYkHGuVSCu6ajx2W5BXWrA=="
       user="EgRnF7RCsH1yBGhjmfGRag=="
   }
   }
   
   ```
   
   But the source treats the blank lines as data content.
   
   
   ### Running Command
   
   ```shell
   seatunnel.sh -c test.conf
   ```
   
   
   ### Error Exception
   
   ```log
   No.
   ```
   
   
   ### Zeta or Flink or Spark Version
   
   _No response_
   
   ### Java or Scala Version
   
   _No response_
   
   ### Screenshots
   
   _No response_
   
   ### Are you willing to submit PR?
   
   - [ ] Yes I am willing to submit a PR!
   
   ### Code of Conduct
   
   - [X] I agree to follow this project's [Code of 
Conduct](https://www.apache.org/foundation/policies/conduct)
   


-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: [email protected]

For queries about this service, please contact Infrastructure at:
[email protected]

Reply via email to