Unicodeのコードポイント頻度測定

以下のコードをprint()で確認すると，以下の結果になったのですが，
#質問内容①
出力される3つの値（i，code_point，counter[code_point]）は，それぞれ何を表しているのですか？

#質問内容②
各要素を文字数で正規化するのは，何のために行っているのですか？

お手数をお掛けしますが，回答お願い致します．
一番下に，全体のコードを記載しています．

#質問箇所

Python
# Unicode code point frequency measurement (excerpt with tracing output).
def count_codePoint(str):
    """Count occurrences of each Unicode code point in ``str``, printing a trace.

    This excerpt only accumulates the counts and prints them; it does not
    return anything.

    Args:
        str: Text whose characters are counted. (The name shadows the
            builtin; it is kept so the signature stays unchanged.)
    """
    # One slot per code point: the code point value is used as the index.
    counter = np.zeros(65535)

    for i, char in enumerate(str):
        # Convert the character to its Unicode code point.
        code_point = ord(char)
        # Valid indices are 0..65534, so 65535 itself must be skipped too;
        # otherwise the increment below raises IndexError.
        if code_point >= 65535:
            continue
        # Increment the occurrence count stored at that code point's slot.
        counter[code_point] += 1
        # Trace output added to inspect what the statements above produce:
        # position in the text, code point, and running count for it.
        print(i)
        print(code_point)
        print(counter[code_point], "\n")

#結果

#全体のコード

Python
1コード
2##利用されている文字が異なる言語を判定###
3import numpy as np
4from sklearn.naive_bayes import GaussianNB
5from sklearn.metrics import accuracy_score
6
# Unicode code point frequency measurement.
def count_codePoint(str):
    """Return the relative frequency of each Unicode code point in ``str``.

    Args:
        str: Text to analyse. (The name shadows the builtin; it is kept so
            the signature stays unchanged for existing callers.)

    Returns:
        A NumPy array of length 65535 in which element ``k`` is the number
        of characters whose code point is ``k`` divided by ``len(str)``.
        Characters with a code point of 65535 or above are not counted,
        although they still contribute to the length used for the division.
        An empty string yields an all-zero array.
    """
    # One slot per code point: the code point value is used as the index.
    counter = np.zeros(65535)

    for i, char in enumerate(str):
        # Convert the character to its Unicode code point.
        code_point = ord(char)
        # Valid indices are 0..65534, so 65535 itself must be skipped too;
        # otherwise the increment below raises IndexError.
        if code_point >= 65535:
            continue
        # Increment the occurrence count stored at that code point's slot.
        counter[code_point] += 1
        # Trace output: position in the text, code point, running count.
        print(i)
        print(code_point)
        print(counter[code_point], "\n")

    # Nothing to normalize for empty input; dividing by zero would fill the
    # result with NaN.
    if not str:
        return counter

    # Dividing by the character count turns raw counts into proportions, so
    # the values no longer scale with the length of the text.
    return counter / len(str)
27
# Training data: one sample sentence per language.
ja_str = "これは日本語の文章です。"
en_str = "This is English Sentences."
th_str = 'นี่เป็นประโยคภาษาไทย'

# Labels are listed in the same order as the feature vectors built below.
y_train = ["ja", "en", 'th']
x_train = [count_codePoint(text) for text in (ja_str, en_str, th_str)]
# print(x_train)

# Fit a Gaussian naive Bayes classifier on the code point frequencies.
clf = GaussianNB().fit(x_train, y_train)

# Evaluation data: a short greeting in each language.
ja_test_str = "こんにちは"
en_test_str = "Hello"
th_test_str = 'สวัสดี'

# The test samples are ordered en, th, ja; y_test follows that same order.
x_test = [
    count_codePoint(text)
    for text in (en_test_str, th_test_str, ja_test_str)
]
# print(x_test)
y_test = ["en", 'th', "ja"]

# Predict the language of each test sample and report the accuracy.
y_pred = clf.predict(x_test)
print(y_pred)
print("正解率=", accuracy_score(y_test, y_pred))