improve occurrence[token] condition
This commit is contained in:
parent
c13b28561d
commit
b0f2ef65d9
@ -378,14 +378,12 @@ class TextRWKV(AbstractRWKV):
|
|||||||
dd = self.pipeline.encode(i)
|
dd = self.pipeline.encode(i)
|
||||||
assert len(dd) == 1
|
assert len(dd) == 1
|
||||||
self.AVOID_REPEAT_TOKENS.add(dd[0])
|
self.AVOID_REPEAT_TOKENS.add(dd[0])
|
||||||
# self.AVOID_PENALTY_TOKENS = set()
|
self.AVOID_PENALTY_TOKENS = set()
|
||||||
# AVOID_PENALTY = (
|
AVOID_PENALTY = '\n,.:?!,。:?!"“”<>[]{}/\\|;;~`@#$%^&*()_+-=0123456789 '
|
||||||
# "\n" # \n,.:?!,。:?!"“”<>[]{}/\\|;;~`@#$%^&*()_+-=0123456789
|
for i in AVOID_PENALTY:
|
||||||
# )
|
dd = self.pipeline.encode(i)
|
||||||
# for i in AVOID_PENALTY:
|
if len(dd) == 1:
|
||||||
# dd = self.pipeline.encode(i)
|
self.AVOID_PENALTY_TOKENS.add(dd[0])
|
||||||
# assert len(dd) == 1
|
|
||||||
# self.AVOID_PENALTY_TOKENS.add(dd[0])
|
|
||||||
|
|
||||||
self.__preload()
|
self.__preload()
|
||||||
|
|
||||||
@ -410,6 +408,7 @@ class TextRWKV(AbstractRWKV):
|
|||||||
token = int(token)
|
token = int(token)
|
||||||
for xxx in occurrence:
|
for xxx in occurrence:
|
||||||
occurrence[xxx] *= self.penalty_decay
|
occurrence[xxx] *= self.penalty_decay
|
||||||
|
if token not in self.AVOID_PENALTY_TOKENS:
|
||||||
if token not in occurrence:
|
if token not in occurrence:
|
||||||
occurrence[token] = 1
|
occurrence[token] = 1
|
||||||
else:
|
else:
|
||||||
|
Loading…
Reference in New Issue
Block a user