FileUtil.getTotalLines()支持CR换行符

This commit is contained in:
Looly 2024-08-29 09:50:07 +08:00
parent 63b2f7c70d
commit c459a0f613
5 changed files with 42 additions and 7 deletions

View File

@ -2,9 +2,10 @@
# 🚀Changelog
-------------------------------------------------------------------------------------------------------------
# 5.8.32(2024-08-24)
# 5.8.32(2024-08-29)
### 🐣新特性
* 【core 】 FileUtil.getTotalLines()支持CR换行符issue#IAMZYR@Gitee
### 🐞Bug修复
* 【http 】 修复getFileNameFromDisposition不符合规范问题issue#IAKBPD@Gitee

View File

@ -572,8 +572,8 @@ public class FileUtil extends PathUtil {
bufferSize = 1024;
}
try (InputStream is = getInputStream(file)) {
byte[] c = new byte[bufferSize];
int readChars = is.read(c);
byte[] chars = new byte[bufferSize];
int readChars = is.read(chars);
if (readChars == -1) {
// 空文件返回0
return 0;
@ -584,23 +584,35 @@ public class FileUtil extends PathUtil {
// 如果多行最后一行无换行符最后一行需要单独计数
// 如果多行最后一行有换行符则空行算作一行
int count = 1;
byte pre;
byte c = 0;
while (readChars == bufferSize) {
for (int i = 0; i < bufferSize; i++) {
if (c[i] == CharUtil.LF) {
pre = c;
c = chars[i];
// 换行符兼容MAC
if (c == CharUtil.LF || pre == CharUtil.CR) {
++count;
}
}
readChars = is.read(c);
readChars = is.read(chars);
}
// count remaining characters
while (readChars != -1) {
for (int i = 0; i < readChars; i++) {
if (c[i] == CharUtil.LF) {
pre = c;
c = chars[i];
if (c == CharUtil.LF || pre == CharUtil.CR) {
++count;
}
}
readChars = is.read(c);
readChars = is.read(chars);
}
// 最后一个字符为换行符则单独计数行
if(c == CharUtil.CR){
++count;
}
return count;

View File

@ -532,6 +532,20 @@ public class FileUtilTest {
assertEquals(8, totalLines);
}
@Test
public void getTotalLinesCrTest() {
// 此文件最后一行有换行符则最后的空行算作一行
final int totalLines = FileUtil.getTotalLines(FileUtil.file("test_lines_cr.csv"));
assertEquals(8, totalLines);
}
@Test
public void getTotalLinesCrlfTest() {
// 此文件最后一行有换行符则最后的空行算作一行
final int totalLines = FileUtil.getTotalLines(FileUtil.file("test_lines_crlf.csv"));
assertEquals(8, totalLines);
}
@Test
public void issue3591Test() {
// 此文件最后一行末尾无换行符

View File

@ -0,0 +1 @@
# 这是一行注释,读取时应忽略 a,b,c,d 1,2,3,4 # 这是一行注释,读取时应忽略 q,w,e,r,"我是一段 带换行的内容" a,s,d,f
Can't render this file because it contains an unexpected character in line 1 and column 141.

View File

@ -0,0 +1,7 @@
# 这是一行注释,读取时应忽略
a,b,c,d
1,2,3,4
# 这是一行注释,读取时应忽略
q,w,e,r,"我是一段
带换行的内容"
a,s,d,f
Can't render this file because it has a wrong number of fields in line 2.