(improvement)(build) Add spotless during the build process. (#1639)

This commit is contained in:
lexluo09
2024-09-07 00:36:17 +08:00
committed by GitHub
parent ee15a88b06
commit 5f59e89eea
986 changed files with 15609 additions and 12706 deletions

View File

@@ -1,6 +1,5 @@
package com.hankcs.hanlp.dictionary;
import com.hankcs.hanlp.HanLP;
import com.hankcs.hanlp.collection.trie.DoubleArrayTrie;
import com.hankcs.hanlp.corpus.io.ByteArray;
@@ -8,6 +7,7 @@ import com.hankcs.hanlp.corpus.io.IOUtil;
import com.hankcs.hanlp.corpus.tag.Nature;
import com.hankcs.hanlp.utility.Predefine;
import com.hankcs.hanlp.utility.TextUtility;
import java.io.BufferedOutputStream;
import java.io.BufferedReader;
import java.io.DataOutputStream;
@@ -21,9 +21,7 @@ import java.util.List;
import java.util.TreeMap;
import java.util.stream.Collectors;
/**
* 使用DoubleArrayTrie实现的核心词典
*/
/** 使用DoubleArrayTrie实现的核心词典 */
public class CoreDictionary {
public static DoubleArrayTrie<Attribute> trie = new DoubleArrayTrie<Attribute>();
@@ -36,8 +34,13 @@ public class CoreDictionary {
if (!load(PATH)) {
throw new IllegalArgumentException("核心词典" + PATH + "加载失败");
} else {
Predefine.logger.info(PATH + "加载成功," + trie.size() + "个词条,耗时"
+ (System.currentTimeMillis() - start) + "ms");
Predefine.logger.info(
PATH
+ "加载成功,"
+ trie.size()
+ "个词条,耗时"
+ (System.currentTimeMillis() - start)
+ "ms");
}
}
@@ -75,15 +78,21 @@ public class CoreDictionary {
totalFrequency += attribute.totalFrequency;
}
Predefine.logger.info(
"核心词典读入词条" + map.size() + " 全部频次" + totalFrequency + ",耗时" + (
System.currentTimeMillis() - start)
"核心词典读入词条"
+ map.size()
+ " 全部频次"
+ totalFrequency
+ ",耗时"
+ (System.currentTimeMillis() - start)
+ "ms");
br.close();
trie.build(map);
Predefine.logger.info("核心词典加载成功:" + trie.size() + "个词条,下面将写入缓存……");
try {
DataOutputStream out = new DataOutputStream(
new BufferedOutputStream(IOUtil.newOutputStream(path + Predefine.BIN_EXT)));
DataOutputStream out =
new DataOutputStream(
new BufferedOutputStream(
IOUtil.newOutputStream(path + Predefine.BIN_EXT)));
Collection<Attribute> attributeList = map.values();
out.writeInt(attributeList.size());
for (Attribute attribute : attributeList) {
@@ -202,25 +211,18 @@ public class CoreDictionary {
return trie.get(key) != null;
}
/**
* 核心词典中的词属性
*/
/** 核心词典中的词属性 */
public static class Attribute implements Serializable {
/**
* 词性列表
*/
/** 词性列表 */
public Nature[] nature;
/**
* 词性对应的词频
*/
/** 词性对应的词频 */
public int[] frequency;
public int totalFrequency;
public String[] originals;
public String original = null;
public Attribute(int size) {
nature = new Nature[size];
frequency = new int[size];
@@ -276,8 +278,11 @@ public class CoreDictionary {
}
return attribute;
} catch (Exception e) {
Predefine.logger.warning("使用字符串" + natureWithFrequency + "创建词条属性失败!"
+ TextUtility.exceptionToString(e));
Predefine.logger.warning(
"使用字符串"
+ natureWithFrequency
+ "创建词条属性失败!"
+ TextUtility.exceptionToString(e));
return null;
}
}
@@ -404,7 +409,10 @@ public class CoreDictionary {
if (originals == null || originals.length == 0) {
return null;
}
return Arrays.stream(originals).filter(o -> o != null).distinct().collect(Collectors.toList());
return Arrays.stream(originals)
.filter(o -> o != null)
.distinct()
.collect(Collectors.toList());
}
}
@@ -431,4 +439,3 @@ public class CoreDictionary {
return load(path);
}
}