Gensim Word2Vec model on the WA Strats data
print(word_vectors.similarity('sedimentary', 'rock'))
0.244842896713
print(word_vectors.similarity('sandstone', 'rhyolite'))
0.164117527643
print(word_vectors.similarity('sandstone', 'rock'))
0.210323180918
word_vectors.most_similar('rock')
[('felsic', 0.39053836464881897),
 ('mafic', 0.29245898127555847),
 ('quartz', 0.2764042317867279),
 ('and', 0.27265167236328125),
 ('volcanic', 0.2520792782306671),
 ('sedimentary', 0.24484288692474365),
 ('-', 0.24219940602779388),
 ('metamorphics', 0.23966048657894135),
 ('granulite-facies', 0.23941434919834137),
 ('group', 0.23868629336357117)]

word_vectors.most_similar('sandstone')
Out[83]:
[('hill', 0.3171369433403015),
 ('range', 0.2612810730934143),
 ('complex', 0.2158491462469101),
 ('point', 0.21551984548568726),
 ('archean', 0.21121595799922943),
 ('rock', 0.21032318472862244),
 ('formation,', 0.19128333032131195),
 ('siltstone', 0.17484164237976074),
 ('sedimentary', 0.17313337326049805),
 ('rhyolite', 0.16411754488945007)]