Fixed a distance bug.

Kalvar · Kalvar · commit 7852d274b90b · 2015-10-18T23:02:55.000+08:00
diff --git a/KRKmeans.podspec b/KRKmeans.podspec
@@ -1,6 +1,6 @@
 Pod::Spec.new do |s|
   s.name         = "KRKmeans"
-  s.version      = "2.4"
+  s.version      = "2.4.1"
   s.summary      = "KRKmeans is clustering algorithm (クラスタリング分類) that one of Machine Learning methods."
   s.description  = <<-DESC
                    KRKmeans has implemented K-Means the clustering algorithm (クラスタリング分類) and achieved multi-dimensional clustering in this project. KRKmeans could be used in data mining (データマイニング), image compression (画像圧縮) and classification.
diff --git a/KRKmeans.xcodeproj/project.xcworkspace/xcuserdata/Kalvar.xcuserdatad/UserInterfaceState.xcuserstate b/KRKmeans.xcodeproj/project.xcworkspace/xcuserdata/Kalvar.xcuserdatad/UserInterfaceState.xcuserstate
diff --git a/KRKmeans/AppDelegate.h b/KRKmeans/AppDelegate.h
@@ -1,6 +1,6 @@
 //
 //  AppDelegate.h
-//  KRKmeans V2.4
+//  KRKmeans V2.4.1
 //
 //  Created by Kalvar on 2014/6/29.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
diff --git a/KRKmeans/AppDelegate.m b/KRKmeans/AppDelegate.m
@@ -1,6 +1,6 @@
 //
 //  AppDelegate.m
-//  KRKmeans V2.4
+//  KRKmeans V2.4.1
 //
 //  Created by Kalvar on 2014/6/29.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
diff --git a/KRKmeans/ViewController.h b/KRKmeans/ViewController.h
@@ -1,6 +1,6 @@
 //
 //  ViewController.h
-//  KRKmeans V2.4
+//  KRKmeans V2.4.1
 //
 //  Created by Kalvar on 2014/6/29.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
diff --git a/KRKmeans/ViewController.m b/KRKmeans/ViewController.m
@@ -1,6 +1,6 @@
 //
 //  ViewController.m
-//  KRKmeans V2.4
+//  KRKmeans V2.4.1
 //
 //  Created by Kalvar on 2014/6/29.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
diff --git a/KRKmeans/main.m b/KRKmeans/main.m
@@ -1,6 +1,6 @@
 //
 //  main.m
-//  KRKmeans V2.4
+//  KRKmeans V2.4.1
 //
 //  Created by Kalvar on 2014/6/29.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
diff --git a/KRKmeansTests/KRKmeansTests.m b/KRKmeansTests/KRKmeansTests.m
@@ -1,6 +1,6 @@
 //
-//  KRKmeans V2.4Tests.m
-//  KRKmeans V2.4Tests
+//  KRKmeans V2.4.1Tests.m
+//  KRKmeans V2.4.1Tests
 //
 //  Created by Kalvar on 2014/6/29.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
diff --git a/ML/KRKmeans.h b/ML/KRKmeans.h
@@ -1,13 +1,13 @@
 //
 //  KRKmeans.h
-//  KRKmeans V2.4
+//  KRKmeans V2.4.1
 //
 //  Created by Kalvar on 2014/6/30.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
 //
 /*
  * @ K-Means
- *   - 條件為 :
+ *   - 演繹原則 :
  *     1. 求出 A 集合與 B 集合之中心位置，或將 A, B 集合直接當成初始群聚中心點 (如果該集合裡只有 1 組資料時)
  *     2. 將 C 集合依 K-Means 理論放置於 A 與 B 集合裡。
  *
@@ -18,14 +18,17 @@
  *     4. 迭代運算，將其重新計算每群聚中心點，再重新分群，直至 MIN(新舊中心點誤差值) 小於設定值或與上次群聚中心點相等時，即停止 1 ~ 3 步驟的迭代運算。
  *     5. 使用 SSE 來評估每一次的分群結果，把每一次分群後的結果 SSE 值記錄起來，再逐步去調整起始中心點，直至比較出最小的 SSE 值，則該群聚結果即為最佳解。
  *
- *   - K-Means 就是將相關聯( 例如距離最近、數字相關、倍數相關、特徵點相關等 )的數字分類在一起，
- *     而後再依照分群結果去做對應結果的方法。
+ *   - K-Means 就是將相關聯( 例如距離最近、數字相關、倍數相關、特徵點相關等 )的數字分類在一起，而後再依照分群結果去做對應結果的方法。
  *
  *   - 已擴充 :
  *     1. 將一群隨機產生的 100 組 (x, y) 2 維資料集合，先做分群分類成 N 組集合群聚( N 可自訂 )。
  *     2. 再做現在將 C 集合分群的動作。
  *     3. 進行分群迭代運算，將每一個分類好的群組重新分群
  *
+ *   - 距離公式說明 :
+ *     1. Cosine Similarity 是種歸屬度的概念，數字越大代表越相近 ( 或是用 1 - 歸屬度，取其差值，就能跟距離概念一樣越小越近了 )
+ *     2. Euclidean Distance 是距離的概念，數字越小代表越相近
+ *
  */
 
 #import <Foundation/Foundation.h>
diff --git a/ML/KRKmeans.m b/ML/KRKmeans.m
@@ -1,6 +1,6 @@
 //
 //  KRKmeans.m
-//  KRKmeans V2.4
+//  KRKmeans V2.4.1
 //
 //  Created by Kalvar on 2014/6/30.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
@@ -84,7 +84,7 @@ -(float)_distanceEuclidean2PointsX1:(NSArray *)_x1 x2:(NSArray *)_x2
                  powf([[_x1 lastObject] floatValue] - [[_x2 lastObject] floatValue], 2));
 }
 
-// Euclidean distance which multi-dimensional formula
+// Multi-dimensional Euclidean distance; a smaller value means the two points are closer
 -(float)_distanceEuclideanX1:(NSArray *)_x1 x2:(NSArray *)_x2
 {
     NSInteger _index = 0;
@@ -98,7 +98,7 @@ -(float)_distanceEuclideanX1:(NSArray *)_x1 x2:(NSArray *)_x2
     return (_index > 0) ? sqrtf(_sum) : _sum;
 }
 
-// Cosine Similarity method that multi-dimensional
+// Multi-dimensional cosine similarity; this is a membership degree, so a larger value means the two vectors are closer
 -(float)_distanceCosineSimilarityX1:(NSArray *)_x1 x2:(NSArray *)_x2
 {
     float _sumA  = 0.0f;
@@ -115,9 +115,11 @@ -(float)_distanceCosineSimilarityX1:(NSArray *)_x1 x2:(NSArray *)_x2
         _sumAB        += ( _aValue * _bValue );
         ++_index;
     }
-    return ( _sumAB / sqrtf( _sumA * _sumB ) );
+    float _ab = _sumA * _sumB;
+    return ( _ab > 0.0f ) ? ( _sumAB / sqrtf( _ab ) ) : 0.0f;
 }
 
+// 距離概念是越小越近，歸屬度概念是越大越近 ( 或取其差值，使歸屬度同距離越小越近 )
 -(float)_distanceX1:(NSArray *)_x1 x2:(NSArray *)_x2
 {
     float _distance = 0.0f;
@@ -127,7 +129,7 @@ -(float)_distanceX1:(NSArray *)_x1 x2:(NSArray *)_x2
             _distance = [self _distanceEuclidean2PointsX1:_x1 x2:_x2];
             break;
         case KRKmeansDimensionalMultiByCosine:
-            _distance = [self _distanceCosineSimilarityX1:_x1 x2:_x2];
+            _distance = 1.0f - [self _distanceCosineSimilarityX1:_x1 x2:_x2];
             break;
         case KRKmeansDimensionalMultiByEuclidean:
             _distance = [self _distanceEuclideanX1:_x1 x2:_x2];
@@ -170,10 +172,9 @@ -(NSMutableArray *)_clusterSources:(NSArray *)_sources compareCenters:(NSArray *
                 //個別求出要分群的集合跟其它集合體的距離
                 float _distance = [self _distanceX1:_xySets x2:_eachSets];
                 //比較出最小的距離，即為歸納分群的對象
-                //是第 1 筆 || 當前距離 < 上一次的距離
+                //是第 1 筆 || 當前距離 < 上一次的距離 ( 如距離為歸屬度，則因已在 _distanceX1:x2: 裡使用了差值運算，故這裡一樣使用 < 即可 )
                 if( _index == 0 || _distance < _lastDistance )
                 {
-                    //記錄起來
                     _lastDistance = _distance;
                     _closeIndex   = _index;
                 }
diff --git a/ML/KRKmeansOne.h b/ML/KRKmeansOne.h
@@ -1,6 +1,6 @@
 //
-//  KRKmeans V2.4.h
-//  KRKmeans V2.4
+//  KRKmeans V2.4.1.h
+//  KRKmeans V2.4.1
 //
 //  Created by Kalvar on 2014/6/29.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
diff --git a/ML/KRKmeansOne.m b/ML/KRKmeansOne.m
@@ -1,6 +1,6 @@
 //
-//  KRKmeans V2.4.m
-//  KRKmeans V2.4
+//  KRKmeans V2.4.1.m
+//  KRKmeans V2.4.1
 //
 //  Created by Kalvar on 2014/6/29.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
diff --git a/ML/NSArray+Statistics.h b/ML/NSArray+Statistics.h
@@ -1,6 +1,6 @@
 //
 //  NSArray+Statistics.h
-//  KRKmeans V2.4
+//  KRKmeans V2.4.1
 //
 //  Created by Kalvar on 2014/6/29.
 //  Copyright (c) 2014 - 2015年 Kalvar Lin, ilovekalvar@gmail.com. All rights reserved.
diff --git a/README.md b/README.md
@@ -7,7 +7,7 @@ KRKmeans has implemented K-Means the clustering algorithm (クラスタリング
 
 ```ruby
 platform :ios, '7.0'
-pod "KRKmeans", "~> 2.4"
+pod "KRKmeans", "~> 2.4.1"
 ```
 
 ## How to use
@@ -174,7 +174,7 @@ If you have trained clusters that you could directly put new patterns into direc
 
 ## Version
 
-V2.4
+V2.4.1
 
 ## License