๋๋ ๋ค์์ด ๋ฒ๊ทธ๋ผ๊ณ ํ์ ํ์ง๋ง ๊ทธ๋ ์ง ์์ ๊ฒฝ์ฐ ์๋ ค์ฃผ์ธ์. ํด๊ฒฐ์ฑ ์ ๋๋จํ ๊ฐ์ฌํ๊ฒ ์ต๋๋ค.
์ ๋ SCKlearn์ ํตํด ํ์ค ์ ํซ ์ธ์ฝ๋ฉ์ ์ํํ๊ณ ์์ผ๋ฉฐ ๊ทธ ๊ณผ์ ์์ ๋ถ๋ช
ํ Numpy๋ฅผ ์ฌ์ฉํ๊ณ ์์ต๋๋ค. ์ธ์ ์ต์
์ ๊ธฐ๋ณธ๊ฐ์ผ๋ก ๋๋ฉด ๋ชจ๋ ๋ฌธ์ ๊ฐ ์์ง๋ง numpy.set_printoptions(threshold='nan')
ํจ์๋ฅผ ์ฌ์ฉํ์ฌ ํ๋์ ํซ ์ธ์ฝ๋ฉ ๋ฐฐ์ด(Numpy ์์ฝ ๋์ ) ์ ์ฒด๋ฅผ ์ธ์ํ๋ฉด ๋ฌธ์ ์ ๋ชฉ์ ์ค๋ฅ๊ฐ ๋ฐ์ํฉ๋๋ค. ๋ค์์ ์ฝ๋์ ํด๋น ์ค๋ฅ/์ถ์ ๋ณด๊ณ ์์
๋๋ค.
import numpy
from numpy import array
from numpy import argmax
from sklearn.preprocessing import LabelEncoder
from sklearn.preprocessing import OneHotEncoder
data = "+++++++++QVQLVQSGGGVVQPGRSLRLSCAASGFTFSSHRMHWVRQAPGKGLEWVAAVSNDGSNEYYADSVKGRFTISRDKSTSTLYLQMDSLRPEDTAVYYCARERCVSSSCWARALDYWGQGSLVTVCS++++++++++"
seq_string = list(data)
print(seq_string)
values = array(seq_string)
print(values)
label_encoder = LabelEncoder()
integer_encoded = label_encoder.fit_transform(values)
print(integer_encoded)
onehot_encoder = OneHotEncoder(sparse=False)
integer_encoded = integer_encoded.reshape(len(integer_encoded), 1)
onehot_encoded = onehot_encoder.fit_transform(integer_encoded)
numpy.set_printoptions(threshold='nan')
print(onehot_encoded)
inverted = label_encoder.inverse_transform([argmax(onehot_encoded[1, :])])
print(inverted)
> ---------------------------------------------------------------------------
TypeError Traceback (most recent call last)
<ipython-input-1-43683b44d2e3> in <module>()
24 onehot_encoded = onehot_encoder.fit_transform(integer_encoded)
25 numpy.set_printoptions(threshold='nan')
---> 26 print(onehot_encoded)
27 # invert first example
28 inverted = label_encoder.inverse_transform([argmax(onehot_encoded[1, :])])
/d/harpy1/s/python/v3-5.1.0/lib/python3.6/site-packages/numpy/core/arrayprint.py in array_str(a, max_line_width, precision, suppress_small)
1400 return str(a[()])
1401
-> 1402 return array2string(a, max_line_width, precision, suppress_small, ' ', "")
1403
1404 def set_string_function(f, repr=True):
/d/harpy1/s/python/v3-5.1.0/lib/python3.6/site-packages/numpy/core/arrayprint.py in array2string(a, max_line_width, precision, suppress_small, separator, prefix, style, formatter, threshold, edgeitems, sign, floatmode, suffix, **kwarg)
620 return "[]"
621
--> 622 return _array2string(a, options, separator, prefix)
623
624
/d/harpy1/s/python/v3-5.1.0/lib/python3.6/site-packages/numpy/core/arrayprint.py in wrapper(self, *args, **kwargs)
420 repr_running.add(key)
421 try:
--> 422 return f(self, *args, **kwargs)
423 finally:
424 repr_running.discard(key)
/d/harpy1/s/python/v3-5.1.0/lib/python3.6/site-packages/numpy/core/arrayprint.py in _array2string(a, options, separator, prefix)
435 data = asarray(a)
436
--> 437 if a.size > options['threshold']:
438 summary_insert = "..."
439 data = _leading_trailing(data, options['edgeitems'])
TypeError: '>' not supported between instances of 'int' and 'str'
๋์ threshold=sys.maxsize
๋ฅผ ์๋ํ์ญ์์ค. threshold
๋ int
๋ก ๋ฌธ์ํ๋์ด ์์ต๋๋ค.
์ฌ๋๋ค์ด "nan" ๋ฌธ์์ด์ ์ ๋ฌํ ๋ 1.16์์ ์์ธ๋ฅผ ๋์ง๊ธฐ ์์ํ์ฌ ํ์ด์ฌ 3์ ์ค๋นํด์ผ ํ ๊น์?
๋ถํํ๋ stackoverflow๋ 'nan'์ ์ ๋ฌํ ๊ฒ์ ๊ถ์ฅํฉ๋๋ค.
SO ์๋ชป๋ ์ ๋ณด ๋งํฌ: https://stackoverflow.com/questions/1987694/how-to-print-the-full-numpy-array
๋์
threshold=sys.maxsize
๋ฅผ ์๋ํ์ญ์์ค.threshold
๋int
๋ก ๋ฌธ์ํ๋์ด ์์ต๋๋ค.
๊ฐ์ฌํฉ๋๋ค! ๊ทธ๊ฒ์ ์๋ฒฝํ๊ฒ ์ ์๋ํ์ต๋๋ค.
์ค์ ๋ก ๋ฌธ์ ๋ ์ธ๊ธ๋ SO ๋งํฌ๋ฅผ ๋ฐ๋ผ ๋ฐ์ํ์ต๋๋ค.
๊ฐ์ฅ ์ ์ฉํ ๋๊ธ
๋์
threshold=sys.maxsize
๋ฅผ ์๋ํ์ญ์์ค.threshold
๋int
๋ก ๋ฌธ์ํ๋์ด ์์ต๋๋ค.