Lecture 1: Intro and Word Vectors¶
TL;DR¶
- Different ways words are represented by computers
- WordNet : manual labeling, traditional method
- Word Vectors
- One-Hot Vectors
- Dense Word Vectors (embeddings)
Meaning of a Word¶
How can we represent the meaning of a word?
WordNet¶
Previously common NLP solution: WordNet
Discrete Symbols¶
- Representing words as discrete symbols, i.e., as one-hot vectors
- Problem
- If a user searches for “Seattle motel”, we would like to match documents containing “Seattle hotel”.
- However, the two vectors below are orthogonal, so one-hot vectors encode no similarity between them (see the sketch at the end of this section)
motel = [0 0 0 0 0 0 0 0 0 0 1 0 0 0 0]
hotel = [0 0 0 0 0 0 0 1 0 0 0 0 0 0 0]
- Solution
- Could try to rely on WordNet’s list of synonyms to get similarity?
- But it is well-known to fail badly: incompleteness, etc.
- Instead: learn to encode similarity in the vectors themselves
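A quick NumPy sketch of this point, using the 15-dimensional one-hot vectors above: two distinct one-hot vectors always have dot product 0, so they carry no similarity signal.
import numpy as np
# One-hot vectors from the example above (vocabulary size 15)
motel = np.zeros(15); motel[10] = 1
hotel = np.zeros(15); hotel[7] = 1
print("motel . hotel =", motel @ hotel)   # 0.0 -> orthogonal, no similarity signal
print("motel . motel =", motel @ motel)   # 1.0 -> a word only matches itself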
WordNet¶
- WordNet is a lexical database of semantic relations between English words, first created by the Cognitive Science Laboratory at Princeton University.
- It includes nouns (N), verbs (V), adjectives (ADJ), and adverbs (ADV) but omits prepositions, determiners, and other function words.
- WordNets for other languages exist too.
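As a quick aside, NLTK can also query wordnets in other languages through the Open Multilingual Wordnet; a minimal sketch, assuming the omw-1.4 corpus downloads cleanly (the Italian lemma "cane", meaning "dog", is just an illustrative query):
import nltk
nltk.download('wordnet')
nltk.download('omw-1.4')   # Open Multilingual Wordnet data
from nltk.corpus import wordnet as wn
# Languages covered by the installed multilingual data
print(sorted(wn.langs())[:10])
# Look up synsets through a non-English lemma (Italian "cane" = "dog")
print(wn.synsets('cane', lang='ita'))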
WordNet Example¶
Downloading the WordNet data with NLTK:
import nltk
nltk.download('wordnet')
from nltk.corpus import wordnet as wn
print('Synsets for the word "invite" in WordNet:\n\n', wn.synsets('invite'))
Synsets for the word "invite" in WordNet: [Synset('invite.n.01'), Synset('invite.v.01'), Synset('invite.v.02'), Synset('tempt.v.03'), Synset('invite.v.04'), Synset('invite.v.05'), Synset('invite.v.06'), Synset('invite.v.07'), Synset('receive.v.05')]
# We can constrain the search by specifying the part of speech
# parts of speech available: ADJ, ADV, ADJ_SAT, NOUN, VERB
# ADJ_SAT: see https://stackoverflow.com/questions/18817396/what-part-of-speech-does-s-stand-for-in-wordnet-synsets
# Way one
print(f'{"-"*20}Way one{"-"*20}')
print('Synsets for the noun "invite" in WordNet:\n\n', wn.synsets('invite', pos=wn.NOUN))
# Way two
print(f'\n\n{"-"*20}Way two{"-"*20}')
# pos: {'n':'noun', 'v':'verb', 's':'adj (s)', 'a':'adj', 'r':'adv'}
print('Synsets for the noun "invite" in WordNet:\n\n', [s for s in wn.synsets('invite') if s.pos()=='n'])
--------------------Way one--------------------
Synsets for the noun "invite" in WordNet:

 [Synset('invite.n.01')]

--------------------Way two--------------------
Synsets for the noun "invite" in WordNet:

 [Synset('invite.n.01')]
# check definition of a synset
print(f'{"-"*20}Definition{"-"*20}')
print('The definition for invite as a noun:\n\n', wn.synset('invite.n.01').definition())
# check the related examples
print(f'\n\n{"-"*20}Examples{"-"*20}')
print('The examples for invite as a noun:\n\n', wn.synset('invite.n.01').examples())
# check the hypernyms
print(f'\n\n{"-"*20}Hypernyms{"-"*20}')
print('The hypernyms for invite as a noun:\n\n', wn.synset('invite.n.01').hypernyms())
--------------------Definition--------------------
The definition for invite as a noun:

 a colloquial expression for invitation

--------------------Examples--------------------
The examples for invite as a noun:

 ["he didn't get no invite to the party"]

--------------------Hypernyms--------------------
The hypernyms for invite as a noun:

 [Synset('invitation.n.01')]
Limitations¶
- Requires human labor
- Impossible to keep up to date for every word
- Missing nuance
- "proficient" is listed as a synoynm for "good"
- Misses new words
- badass, nifty, etc.
- Cannot compute word similarity accurately (path similarity scores range from 0 to 1)
dog = wn.synset('dog.n.01')
cat = wn.synset('cat.n.01')
print('The path similarity between cat(noun) and dog(noun): ', dog.path_similarity(cat))
The path similarity between cat(noun) and dog(noun): 0.2
Word Vectors (AKA Embeddings)¶
- When a word w appears in a text, the context is the set of words that appear nearby.
- Context words build up a representation of w
- A dense vector is learned for each word, with similarity measured by the vector dot product
Word Space
- Note that:
- has, have, had are grouped together
- come, go are closely grouped
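A minimal sketch of the dot-product idea with made-up 4-dimensional vectors (real embeddings are learned and typically have hundreds of dimensions): similar words get a large dot product / cosine similarity.
import numpy as np
# Made-up dense vectors purely for illustration (real ones are learned from data)
banking  = np.array([ 0.29,  0.21, -0.41,  0.58])
monetary = np.array([ 0.30,  0.19, -0.38,  0.55])
cricket  = np.array([-0.51,  0.42,  0.10, -0.07])
def cosine(u, v):
    """Cosine similarity: dot product of the two vectors after normalization."""
    return u @ v / (np.linalg.norm(u) * np.linalg.norm(v))
print("banking vs monetary:", cosine(banking, monetary))  # close to 1 -> similar
print("banking vs cricket: ", cosine(banking, cricket))   # much lower -> dissimilar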
Word2vec¶
Word2Vec is a framework for learning word vectors
How it works:
- Get a large corpus (Latin for "body") of text
- Create a vector for each word in a fixed vocabulary
- Go through each position t in the text, which has center word c and context words o
- Find the probability of o given c (or vice versa) using the similarity of the word vectors for c and o
- Keep adjusting the word vectors to maximize these probabilities
Core idea: what is the probability of a word occurring in the context of the center word?
If the window size = 2, the model predicts the likelihood of the 2 words that come before and after the center word (see the sketch below).
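A small sketch of window-based context extraction; the helper function and the example sentence are made up for illustration.
def context_pairs(tokens, window=2):
    """Collect (center, context) pairs within a fixed-size window."""
    pairs = []
    for t, center in enumerate(tokens):
        for j in range(-window, window + 1):
            if j != 0 and 0 <= t + j < len(tokens):
                pairs.append((center, tokens[t + j]))
    return pairs
sentence = "problems turning into banking crises as".split()
for center, context in context_pairs(sentence, window=2):
    print(f"P({context} | {center})")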
Objective Function¶
Likelihood: a measure of how well a given data sample fits a model. For each position t = 1, ..., T, predict context words within a window of fixed size m, given the center word w_t.
Data Likelihood Formula :
$$ Likelihood = L(\theta) = \prod_{t=1}^{T} \prod_{\substack{-m \leq j \leq m \\ j \neq 0}} P(w_{t+j} \mid w_t; \theta) $$
# Likelihood Function
import numpy as np
def likelihood(X, theta):
    """
    Computes the likelihood function for given data X and parameter theta.
    Assumes a Gaussian likelihood with mean=theta and variance=1.
    """
    return np.prod(1 / np.sqrt(2 * np.pi) * np.exp(-0.5 * (X - theta)**2))
# Example Usage
np.random.seed(42)
X = np.random.normal(loc=5, scale=2, size=100) # Sample data from Gaussian
theta_test = 5.0
likelihood_val = likelihood(X, theta_test)
print("Likelihood:", likelihood_val)
Likelihood: 1.7064553444710973e-112
Objective Function (AKA loss function): this is what is minimized. Lower loss means better predictive accuracy.
Loss Function Formula:
$$ J(\theta) = -\frac{1}{T} \log L(\theta) = -\frac{1}{T} \sum_{t=1}^{T} \sum_{\substack{-m \leq j \leq m \\ j \neq 0}} \log P(w_{t+j} \mid w_t; \theta) $$
- This is the average negative log likelihood
Next question: how is the probability P calculated? -> the prediction function
# Negative Log-Likelihood Function
def negative_log_likelihood(X, theta):
    """
    Computes the Negative Log-Likelihood (NLL) for a Gaussian distribution.
    """
    return -np.sum(-0.5 * (X - theta)**2 - 0.5 * np.log(2 * np.pi))
nll_val = negative_log_likelihood(X, theta_test)
print("Negative Log-Likelihood:", nll_val)
Negative Log-Likelihood: 257.3551120942153
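To connect the generic Gaussian examples above back to the skip-gram formulas, here is a sketch that evaluates L(theta) and J(theta) on a toy corpus, using a hand-made probability table in place of a learned model (everything here is made up purely for illustration):
import numpy as np
# Toy corpus and window size
tokens = "the cat sat on the mat".split()
m = 2
# Hand-made P(context | center) lookup standing in for a learned model;
# any (context, center) pair not listed falls back to a small default probability.
toy_prob = {("cat", "the"): 0.3, ("sat", "cat"): 0.4, ("the", "sat"): 0.2,
            ("on", "sat"): 0.3, ("mat", "the"): 0.3}
default_p = 0.05
T = len(tokens)
log_likelihood = 0.0
for t, center in enumerate(tokens):
    for j in range(-m, m + 1):
        if j != 0 and 0 <= t + j < T:
            p = toy_prob.get((tokens[t + j], center), default_p)
            log_likelihood += np.log(p)
print("L(theta) =", np.exp(log_likelihood))   # product of all P(context | center)
print("J(theta) =", -log_likelihood / T)      # average negative log-likelihood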
Prediction function¶
For a given center word c, the probability of a context word o appearing is:
$$ P(o \mid c) = \frac{\exp(u_o^T v_c)}{\sum_{w \in V} \exp(u_w^T v_c)} $$
Numerator
$$ \exp(u_o^T v_c) $$
- Calculates the similarity between the context word o and the center word c
- $ u_o^T v_c $ is the dot product between vector representations of o and c -> measure of how similar the two words are in embedding space
- Applying the exponential function (exp) ensures that every term is positive, so the denominator can normalize the values into a probability distribution.
Denominator
$$ \sum_{w \in V} \exp(u_w^T v_c) $$
- Sums over all words in the vocabulary V
- Ensures that the probability values sum to 1, making the formula a valid probability distribution
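A tiny worked example of the formula with a made-up 3-word vocabulary, just to show how the numerator and denominator interact (a fuller implementation follows below):
import numpy as np
# Made-up dot products u_w^T v_c for a 3-word vocabulary, with o = "banking"
scores = {"banking": 2.0, "crises": 1.0, "cat": -1.0}
numerator = np.exp(scores["banking"])                   # exp(u_o^T v_c)
denominator = sum(np.exp(s) for s in scores.values())   # sum over the whole vocabulary V
print("P(banking | c) =", numerator / denominator)      # about 0.705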
Softmax function¶
- TLDR: The softmax function converts a vector of real numbers into a probability distribution
- Why use this?
- The output values lie in the range of (0,1) and sum to 1, making them interpretable as probabilities.
- In the final layer of a NN, softmax ensures that predictions are probabilities over multiple classes.
- "max" because amplifies probability of largest $ x_i $
- "soft" because still assigns some probability to smaller $ x_i $
$$ \text{softmax}(x_i) = \frac{\exp(x_i)}{\sum_{j=1}^{n} \exp(x_j)} $$
# Prediction Function
def softmax(x):
    """
    Computes the softmax function for an array x.
    """
    exp_x = np.exp(x - np.max(x))  # Subtract max for numerical stability
    return exp_x / exp_x.sum()

def predict_probabilities(center_vector, vocabulary):
    """
    Computes P(o|c) for every word o in the vocabulary using softmax.
    center_vector is v_c; each row of vocabulary is an outside vector u_w.
    """
    scores = np.dot(vocabulary, center_vector)  # u_w^T v_c for every word w
    return softmax(scores)
# Prediction Example
vocab_size = 10
embedding_dim = 5
vocabulary = np.random.rand(vocab_size, embedding_dim)  # Fake outside vectors u_w
center_vector = np.random.rand(embedding_dim)           # Fake center vector v_c
probabilities = predict_probabilities(center_vector, vocabulary)
print("Prediction Probabilities:", probabilities)
Prediction Probabilities: [0.07444069 0.13176847 0.10419385 0.06380236 0.10424873 0.11576871 0.11774626 0.06498345 0.09594868 0.12709881]
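Putting the pieces together, a sketch that evaluates the objective J(theta) on a toy corpus by reusing predict_probabilities() above; the corpus, the index mapping, and the random embeddings are made up for illustration.
# Objective J(theta) on a toy corpus, reusing predict_probabilities() from above.
np.random.seed(0)
corpus = "the cat sat on the mat".split()
word2idx = {w: i for i, w in enumerate(sorted(set(corpus)))}
V, d, m = len(word2idx), 5, 2             # vocab size, embedding dim, window size
U = np.random.rand(V, d)                  # outside ("context") vectors u_w
C = np.random.rand(V, d)                  # center vectors v_c
T = len(corpus)
loss = 0.0
for t, center in enumerate(corpus):
    probs = predict_probabilities(C[word2idx[center]], U)   # P(. | center) over the vocab
    for j in range(-m, m + 1):
        if j != 0 and 0 <= t + j < T:
            loss -= np.log(probs[word2idx[corpus[t + j]]])
print("J(theta) =", loss / T)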
Optimization¶
Training the model :