def _joke_topic_distribution(jokeID, sqlContext):
    """Fetch the ``topicDistribution`` value of one joke as a sequence.

    Raises:
        ValueError: if the ``jokes`` table has no row with this ``jokeID``.
    """
    jokes = sqlContext.table("jokes")
    # Filter through the DataFrame API so the ID is bound as a literal
    # instead of being spliced into a SQL string.
    row = (jokes.where(jokes["jokeID"] == jokeID)
           .select("topicDistribution")
           .first())
    if row is None:
        raise ValueError("no joke found with jokeID {!r}".format(jokeID))
    topics = row.topicDistribution
    # NOTE(review): the column is presumably an MLlib vector (e.g. LDA
    # output); plain array columns are passed through unchanged.
    return topics.toArray() if hasattr(topics, "toArray") else topics


def joke_distance(jokeOneID, jokeTwoID, sqlContext, p=2):
    """Return the p-norm distance between two jokes' topic distributions.

    Looks up the ``topicDistribution`` of each joke in the ``jokes`` table
    and returns ``||one - two||_p``.

    Args:
        jokeOneID: ``jokeID`` of the first joke.
        jokeTwoID: ``jokeID`` of the second joke.
        sqlContext: Spark SQL entry point through which the ``jokes`` table
            is reachable.
        p: order of the norm (2 gives the Euclidean distance).

    Returns:
        The distance as a float; 0.0 when both distributions are equal.

    Raises:
        ValueError: if either joke is missing, or if the two distributions
            have different lengths.
    """
    topics_one = _joke_topic_distribution(jokeOneID, sqlContext)
    topics_two = _joke_topic_distribution(jokeTwoID, sqlContext)
    if len(topics_one) != len(topics_two):
        raise ValueError(
            "topic distributions differ in length: {} vs {}".format(
                len(topics_one), len(topics_two)))
    # DataFrame.subtract() is a row-level set difference (EXCEPT DISTINCT),
    # so the element-wise difference has to be computed on the vectors.
    disparity = [a - b for a, b in zip(topics_one, topics_two)]
    # Vectors.norm already applies the 1/p root; do not apply it again.
    return Vectors.norm(Vectors.dense(disparity), p)