Skip to content
Snippets Groups Projects
Commit 3a30f7f3 authored by Mingchung Xia's avatar Mingchung Xia
Browse files

Minor comment changes

parent 7e892787
No related branches found
No related tags found
1 merge request!13HNSW Implementation with Testcases
...@@ -27,7 +27,7 @@ import PriorityHeapAlgorithms ...@@ -27,7 +27,7 @@ import PriorityHeapAlgorithms
import SimilarityMetric import SimilarityMetric
import HNSWAlgorithm import HNSWAlgorithm
import HNSWEphemeral import HNSWEphemeral
import GameplayKit /// Not avaliable on Linux? import GameplayKit // Not avaliable on Linux? - try to change to other random
class HNSWCorpus<Scalar: BinaryFloatingPoint & Codable>: SNLPCorpus { class HNSWCorpus<Scalar: BinaryFloatingPoint & Codable>: SNLPCorpus {
...@@ -36,9 +36,11 @@ class HNSWCorpus<Scalar: BinaryFloatingPoint & Codable>: SNLPCorpus { ...@@ -36,9 +36,11 @@ class HNSWCorpus<Scalar: BinaryFloatingPoint & Codable>: SNLPCorpus {
var zeroes: [Scalar] var zeroes: [Scalar]
var count: Int { 0 } var count: Int { 0 }
/// typicalNeighbourhoodSize = 20 is a standard benchmark // typicalNeighbourhoodSize = 20 is a standard benchmark
var encodedDocuments: DeterministicSampleVectorIndex = DeterministicSampleVectorIndex<[Scalar]>(typicalNeighborhoodSize: 20) var encodedDocuments: DeterministicSampleVectorIndex = DeterministicSampleVectorIndex<[Scalar]>(typicalNeighborhoodSize: 20)
// Map from Key to documentId - similar to DictionaryCorpus
init(_documentEncoder: ContextFreeEncoder<Scalar>) { init(_documentEncoder: ContextFreeEncoder<Scalar>) {
self._documentEncoder = _documentEncoder self._documentEncoder = _documentEncoder
zeroes = Array(repeating: Scalar(0), count: 384) zeroes = Array(repeating: Scalar(0), count: 384)
...@@ -46,15 +48,13 @@ class HNSWCorpus<Scalar: BinaryFloatingPoint & Codable>: SNLPCorpus { ...@@ -46,15 +48,13 @@ class HNSWCorpus<Scalar: BinaryFloatingPoint & Codable>: SNLPCorpus {
@inlinable @inlinable
func addUntokenizedDocument(_ document: String) { func addUntokenizedDocument(_ document: String) {
/// Forced cast to [Scalar] is unnecessary encodedDocuments.insert((_documentEncoder.encodeSentence(document))) /// as! [Scalar] not needed
encodedDocuments.insert((_documentEncoder.encodeSentence(document)))
} }
} }
public struct DeterministicSampleVectorIndex<Vector: Collection & Codable> where Vector.Element: BinaryFloatingPoint { public struct DeterministicSampleVectorIndex<Vector: Collection & Codable> where Vector.Element: BinaryFloatingPoint {
/// EmphermalVectorIndex<Key: BinaryInteger, Level: BinaryInteger, Metric: SimilarityMetric, Metadata>
public typealias Index = EphemeralVectorIndex<Int, Int, CartesianDistanceMetric<Vector>, Void> public typealias Index = EphemeralVectorIndex<Int, Int, CartesianDistanceMetric<Vector>, Void>
public var base: Index public var base: Index
...@@ -78,8 +78,7 @@ public struct DeterministicSampleVectorIndex<Vector: Collection & Codable> where ...@@ -78,8 +78,7 @@ public struct DeterministicSampleVectorIndex<Vector: Collection & Codable> where
public mutating func insert(_ vector: Vector) { public mutating func insert(_ vector: Vector) {
let convertedVector: [Double] = vector.map{ Double($0) } let convertedVector: [Double] = vector.map{ Double($0) }
if let metricVector = convertedVector as? CartesianDistanceMetric<Vector>.Vector { if let metricVector = convertedVector as? CartesianDistanceMetric<Vector>.Vector {
/// Returns a Key (unused) base.insert(metricVector, using: &graphRNG) /// returns an unused 'Key' type
base.insert(metricVector, using: &graphRNG)
} else { } else {
fatalError("Unable to get metric vector") fatalError("Unable to get metric vector")
} }
...@@ -97,6 +96,7 @@ public struct CartesianDistanceMetric<Vector: Collection & Codable>: SimilarityM ...@@ -97,6 +96,7 @@ public struct CartesianDistanceMetric<Vector: Collection & Codable>: SimilarityM
} }
struct DeterministicRandomNumberGenerator: RandomNumberGenerator { struct DeterministicRandomNumberGenerator: RandomNumberGenerator {
// Try another package for this...
private let randomSource: GKMersenneTwisterRandomSource private let randomSource: GKMersenneTwisterRandomSource
init(seed: UInt64) { init(seed: UInt64) {
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment