Commit 039f6610 authored by pengxin

去掉清洗数据规则。

parent aac5aa9d
...@@ -312,15 +312,11 @@ public class DatasetCleanServiceImpl extends BaseService<DatasetClean, Long> imp ...@@ -312,15 +312,11 @@ public class DatasetCleanServiceImpl extends BaseService<DatasetClean, Long> imp
} }
} }
public static void main (String [] args) {
readJsonAppendSymbol("C:\\Users\\Administrator\\Desktop\\ee_V1.json");
}
/** /**
* 解析文件去掉多余的数据,比如文件里面最后一个,多加了一个",",缺少符号[] * 解析文件去掉多余的数据,比如文件里面最后一个,多加了一个",",缺少符号[]
* @param filePath 文件地址 * @param filePath 文件地址
*/ */
private static void readJsonAppendSymbol(String filePath) { private void readJsonAppendSymbol(String filePath) {
try (FileReader fileReader = new FileReader(filePath); try (FileReader fileReader = new FileReader(filePath);
BufferedReader bufferedReader = new BufferedReader(fileReader)) { BufferedReader bufferedReader = new BufferedReader(fileReader)) {
......
...@@ -25,7 +25,6 @@ public class DataCleanerUtil { ...@@ -25,7 +25,6 @@ public class DataCleanerUtil {
badWords.add("色情"); badWords.add("色情");
badWords.add("淫秽"); badWords.add("淫秽");
badWords.add("迷信"); badWords.add("迷信");
badWords.add("黄色");
badWords.add("性行为"); badWords.add("性行为");
badWords.add("暴力"); badWords.add("暴力");
} }
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment