質問編集履歴

コードの位置

2022/10/19 01:19

投稿

mable

スコア2

title CHANGED Viewed

File without changes

body CHANGED Viewed

@@ -153,9 +153,9 @@
   num = num + 1
 dfh = pd.read_csv("point.csv",names=["cluster_id","latitude","longitude"])
-B = pd.read_csv("pps.csv",usecols=["#people"])
+B = pd.read_csv("pps.csv",usecols=["people"])
-#dfh2= pd.DataFrame(B['#people'])
+#dfh2= pd.DataFrame(B['people'])
-dfh['#people']= B
+dfh['people']= B
 dfh.to_csv("point.csv")
 ```

Python Excel

コードを戻した

2022/10/18 06:29

投稿

mable

スコア2

title CHANGED Viewed

File without changes

body CHANGED Viewed

@@ -49,9 +49,98 @@
 ```python
 ソースコード
+#1回目の訪問先の抽出
+from matplotlib import pyplot as plt
+from sklearn import datasets, preprocessing
+from sklearn.cluster import KMeans
+import numpy as np
+import pandas as pd
+import cartopy.crs as ccrs
+import cartopy.io.shapereader as shpreader
+pd.set_option('display.max_rows',600)
+#前処理後のcsvを読み込み
+yomi=pd.read_csv("simulationkai.csv")
+df=pd.read_csv("simulationkai.csv",usecols=["longitude","latitude"])
+# DataFrameに変換
+print(df.head())
+# データの整形
+X = df
+# クラスタリング
+cls = KMeans(n_clusters=4)
+result = cls.fit(X)
+X['cluster'] = result.labels_
+PC= pd.DataFrame(X['cluster'])
+PC
+df.head()
+#yomiのデータフレームにcluster(クラスタ番号)を追加する
+yomi['cluster_id']=PC
+yomi
+#yomi(元データにクラスタ番号を追加したもの)をallclsdata.csvに保存する
+yomi.to_csv("allclsdata.csv")
+D = X.sort_values(by="cluster")
+D = D.drop_duplicates(subset='cluster')
+D
+# 各クラスタ内のデータ数をカウント
+V = X['cluster'].value_counts()
+V
+# 各クラスタの番号とデータ数をclsvalue.csvに保存
+V.to_csv("clsvalue.csv")
+# クラスタの重心確認
+C = pd.DataFrame(result.cluster_centers_)
+C
+C.iloc[0, :]
+lat= X['latitude'].tolist()
+lon= X['longitude'].tolist()
+clat=C[0].tolist()
+clon=C[1].tolist()
+#0から3まで(計4個)のクラスタのデータからそれぞれ同じ被験者の重複を省いてデータ人数を取得して順番にCSVにまとめる
+from csv import writer
+#pp = pd.DataFrame
+#ppi =  pd.DataFrame
+#yomiからWhile文でN番目のクラスタのデータのみ抽出
+i = 0
+while i <= 3:
+  yomic = yomi[yomi['cluster_id']== i]
+#N番目のクラスタdfから被験者idの重複を消す
+  yomics = yomic.drop_duplicates(subset=["id_questionnaire"])
+#N番目の加工後データの行数をCSVに付け足す
+  #file = [i,len(yomics)]
+  #ppi = pp.append([file], ignore_index=True)
+  #ppi.to_csv("pp.csv")
+  list_data=[i,len(yomics)]
+  with open('pp.csv', 'a', newline='') as f_object:
+   writer_object = writer(f_object)
+   writer_object.writerow(list_data)
+   f_object.close()
+  i = i + 1
+#else:
+  #ppi.to_csv("pp.csv")
+#pp.csv内の人数を降順にしたものをpps.csvに保存
+PP = pd.read_csv("pp.csv",names=["cls","people"])
+T = PP.sort_values(by=["people"],ascending=False)
+T.to_csv("pps.csv")
+PP.to_csv("pp.csv")
 #pps.csvの上から順番にクラスタ番号を引き出してその番号の座標をCから引き出す
 num = 0
-while num <= 99:
+while num <= 3:
   Tn = T.iloc[num,0]
   #Tno = Tn + 1
   Cn = C.iloc[Tn,0]
@@ -64,9 +153,9 @@
   num = num + 1
 dfh = pd.read_csv("point.csv",names=["cluster_id","latitude","longitude"])
-B = pd.read_csv("pps.csv",usecols=["people"])
+B = pd.read_csv("pps.csv",usecols=["#people"])
-#dfh2= pd.DataFrame(B['people'])
+#dfh2= pd.DataFrame(B['#people'])
-dfh['people']= B
+dfh['#people']= B
 dfh.to_csv("point.csv")
 ```

Python Excel

最初のエラーを記載

2022/10/18 06:19

投稿

mable

スコア2

title CHANGED Viewed

File without changes

body CHANGED Viewed

@@ -13,43 +13,32 @@
 エラーメッセージ
->>> #pps.csvの上から順番にクラスタ番号を引き出してその番号の座標をCから引き出す
->>> num = 0
->>> while num <= 3:
-... Tn = T.iloc[num,0]
-... #Tno = Tn + 1
-... Cn = C.iloc[Tn,0]
-... Cn2 = C.iloc[Tn,1]
-... list_data2=[Tn,Cn,Cn2]
-... with open('point.csv', 'a', newline='') as f_object:
-... writer_object = writer(f_object)
+C:\datasyori>python hoge.py
-... writer_object.writerow(list_data2)
-... f_object.close()
-... num = num + 1
+    latitude   longitude
-...
+0  35.693590  139.712202
+1  35.693497  139.712096
+2  35.693217  139.712261
+3  35.693549  139.712430
+4  35.693621  139.712501
 Traceback (most recent call last):
-File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 769, in _validate_tuple_indexer
+  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 769, in _validate_tuple_indexer
-self._validate_key(k, i)
+    self._validate_key(k, i)
-File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 1378, in _validate_key
+  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 1378, in _validate_key
-raise ValueError(f"Can only index by location with a [{self._valid_types}]")
+    raise ValueError(f"Can only index by location with a [{self._valid_types}]")
 ValueError: Can only index by location with a [integer, integer slice (START point is INCLUDED, END point is EXCLUDED), listlike of integers, boolean array]
 The above exception was the direct cause of the following exception:
 Traceback (most recent call last):
-File "<stdin>", line 4, in <module>
+  File "C:\datasyori\hoge.py", line 95, in <module>
+    Cn = C.iloc[Tn,0]
-File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 961, in __getitem__
+  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 961, in __getitem__
-return self._getitem_tuple(key)
+    return self._getitem_tuple(key)
-File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 1458, in _getitem_tuple
+  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 1458, in _getitem_tuple
-tup = self._validate_tuple_indexer(tup)
+    tup = self._validate_tuple_indexer(tup)
-File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 771, in _validate_tuple_indexer
+  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 771, in _validate_tuple_indexer
-raise ValueError(
+    raise ValueError(
 ValueError: Location based indexing can only have [integer, integer slice (START point is INCLUDED, END point is EXCLUDED), listlike of integers, boolean array] types
->>> dfh = pd.read_csv("point.csv",names=["cluster_id","latitude","longitude"])
->>> B = pd.read_csv("pps.csv",usecols=["people"])
->>> #dfh2= pd.DataFrame(B['people'])
->>> dfh['people']= B
->>> dfh.to_csv("point.csv")
 ```
@@ -59,95 +48,7 @@
 ```python
 ソースコード
-#1回目の訪問先の抽出
-from matplotlib import pyplot as plt
-from sklearn import datasets, preprocessing
-from sklearn.cluster import KMeans
-import numpy as np
-import pandas as pd
-import cartopy.crs as ccrs
-import cartopy.io.shapereader as shpreader
-pd.set_option('display.max_rows',600)
-#前処理後のcsvを読み込み
-yomi=pd.read_csv("simulationkai.csv")
-df=pd.read_csv("simulationkai.csv",usecols=["longitude","latitude"])
-# DataFrameに変換
-print(df.head())
-# データの整形
-X = df
-# クラスタリング
-cls = KMeans(n_clusters=100)
-result = cls.fit(X)
-X['cluster'] = result.labels_
-PC= pd.DataFrame(X['cluster'])
-PC
-df.head()
-#yomiのデータフレームにcluster(クラスタ番号)を追加する
-yomi['cluster_id']=PC
-yomi
-#yomi(元データにクラスタ番号を追加したもの)をallclsdata.csvに保存する
-yomi.to_csv("allclsdata.csv")
-D = X.sort_values(by="cluster")
-D = D.drop_duplicates(subset='cluster')
-D
-# 各クラスタ内のデータ数をカウント
-V = X['cluster'].value_counts()
-V
-# 各クラスタの番号とデータ数をclsvalue.csvに保存
-V.to_csv("clsvalue.csv")
-# クラスタの重心確認
-C = pd.DataFrame(result.cluster_centers_)
-C
-C.iloc[0, :]
-lat= X['latitude'].tolist()
-lon= X['longitude'].tolist()
-clat=C[0].tolist()
-clon=C[1].tolist()
-#から100までのクラスタのデータからそれぞれ同じ被験者の重複を省いてデータ人数を取得して順番にCSVにまとめる
-from csv import writer
-#pp = pd.DataFrame
-#ppi =  pd.DataFrame
-#yomiからWhile文でN番目のクラスタのデータのみ抽出
-i = 0
-while i <= 99:
-  yomic = yomi[yomi['cluster_id']== i]
-#N番目のクラスタdfから被験者idの重複を消す
-  yomics = yomic.drop_duplicates(subset=["id_questionnaire"])
-#N番目の加工後データの行数をCSVに付け足す
-  #file = [i,len(yomics)]
-  #ppi = pp.append([file], ignore_index=True)
-  #ppi.to_csv("pp.csv")
-  list_data=[i,len(yomics)]
-  with open('pp.csv', 'a', newline='') as f_object:
-   writer_object = writer(f_object)
-   writer_object.writerow(list_data)
-   f_object.close()
-  i = i + 1
-#else:
-  #ppi.to_csv("pp.csv")
-#pp.csv内の人数を降順にしたものをpps.csvに保存
-PP = pd.read_csv("pp.csv",names=["cls","people"])
-T = PP.sort_values(by=["people"],ascending=False)
-T.to_csv("pps.csv")
-PP.to_csv("pp.csv")
 #pps.csvの上から順番にクラスタ番号を引き出してその番号の座標をCから引き出す
 num = 0
 while num <= 99:
@@ -171,8 +72,7 @@
 ### 試したこと
-peopleの値がみつからないなどと書いてあったのでしっかりと確認しましたがデータにもあるのでよく理解できない。
-BがdefineなどあるがBの定義もしているのでどこが違うのでしょうか。
+勉強不足でエラーの内容が全く分かっていません。
 ### 補足情報（FW/ツールのバージョンなど）
 Python 3.10.4 (tags/v3.10.4:9d38120, Mar 23 2022, 23:13:41) [MSC v.1929 64 bit (AMD64)] on win32

Python Excel

新たなコード

2022/10/18 05:17

投稿

mable

スコア2

title CHANGED Viewed

File without changes

body CHANGED Viewed

@@ -12,62 +12,43 @@
 ```python
 エラーメッセージ
-#pps.csvの上から順番にクラスタ番号を引き出してその番号の座標をCから引き出す
+>>> #pps.csvの上から順番にクラスタ番号を引き出してその番号の座標をCから引き出す
 >>> num = 0
->>> while num <= 99:
+>>> while num <= 3:
-...   Tn = T.iloc[num,0]
+... Tn = T.iloc[num,0]
-...   #Tno = Tn + 1
+... #Tno = Tn + 1
-...   Cn = C.iloc[Tn,0]
+... Cn = C.iloc[Tn,0]
-...   Cn2 = C.iloc[Tn,1]
+... Cn2 = C.iloc[Tn,1]
-...   list_data2=[Tn,Cn,Cn2]
+... list_data2=[Tn,Cn,Cn2]
-...   with open('point.csv', 'a', newline='') as f_object:
+... with open('point.csv', 'a', newline='') as f_object:
-...    writer_object = writer(f_object)
+... writer_object = writer(f_object)
-...    writer_object.writerow(list_data2)
+... writer_object.writerow(list_data2)
-...    f_object.close()
+... f_object.close()
-...   num = num + 1
+... num = num + 1
 ...
 Traceback (most recent call last):
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 769, in _validate_tuple_indexer
+File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 769, in _validate_tuple_indexer
-    self._validate_key(k, i)
+self._validate_key(k, i)
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 1378, in _validate_key
+File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 1378, in _validate_key
-    raise ValueError(f"Can only index by location with a [{self._valid_types}]")
+raise ValueError(f"Can only index by location with a [{self._valid_types}]")
 ValueError: Can only index by location with a [integer, integer slice (START point is INCLUDED, END point is EXCLUDED), listlike of integers, boolean array]
 The above exception was the direct cause of the following exception:
 Traceback (most recent call last):
-  File "<stdin>", line 4, in <module>
+File "<stdin>", line 4, in <module>
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 961, in __getitem__
+File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 961, in __getitem__
-    return self._getitem_tuple(key)
+return self._getitem_tuple(key)
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 1458, in _getitem_tuple
+File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 1458, in _getitem_tuple
-    tup = self._validate_tuple_indexer(tup)
+tup = self._validate_tuple_indexer(tup)
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 771, in _validate_tuple_indexer
+File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\core\indexing.py", line 771, in _validate_tuple_indexer
-    raise ValueError(
+raise ValueError(
 ValueError: Location based indexing can only have [integer, integer slice (START point is INCLUDED, END point is EXCLUDED), listlike of integers, boolean array] types
 >>> dfh = pd.read_csv("point.csv",names=["cluster_id","latitude","longitude"])
->>> B = pd.read_csv("pps.csv",usecols=["#people"])
+>>> B = pd.read_csv("pps.csv",usecols=["people"])
-Traceback (most recent call last):
-  File "<stdin>", line 1, in <module>
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\util\_decorators.py", line 311, in wrapper
-    return func(*args, **kwargs)
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\io\parsers\readers.py", line 680, in read_csv
-    return _read(filepath_or_buffer, kwds)
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\io\parsers\readers.py", line 575, in _read
-    parser = TextFileReader(filepath_or_buffer, **kwds)
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\io\parsers\readers.py", line 933, in __init__
-    self._engine = self._make_engine(f, self.engine)
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\io\parsers\readers.py", line 1235, in _make_engine
-    return mapping[engine](f, **self.options)
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\io\parsers\c_parser_wrapper.py", line 131, in __init__
-    self._validate_usecols_names(usecols, self.orig_names)
-  File "C:\Users\mable\AppData\Local\Programs\Python\Python310\lib\site-packages\pandas\io\parsers\base_parser.py", line 913, in _validate_usecols_names
-    raise ValueError(
-ValueError: Usecols do not match columns, columns expected but not found: ['#people']
->>> #dfh2= pd.DataFrame(B['#people'])
+>>> #dfh2= pd.DataFrame(B['people'])
->>> dfh['#people']= B
+>>> dfh['people']= B
-Traceback (most recent call last):
-  File "<stdin>", line 1, in <module>
-NameError: name 'B' is not defined
 >>> dfh.to_csv("point.csv")
@@ -182,9 +163,9 @@
   num = num + 1
 dfh = pd.read_csv("point.csv",names=["cluster_id","latitude","longitude"])
-B = pd.read_csv("pps.csv",usecols=["#people"])
+B = pd.read_csv("pps.csv",usecols=["people"])
-#dfh2= pd.DataFrame(B['#people'])
+#dfh2= pd.DataFrame(B['people'])
-dfh['#people']= B
+dfh['people']= B
 dfh.to_csv("point.csv")
 ```

Python Excel