from tensorflow.keras.datasets import imdb

def get(vocavbulary):
    """Load the IMDB dataset and return its reviews decoded back into text.

    Args:
        vocavbulary: Passed to ``imdb.load_data`` as ``num_words`` (the
            vocabulary size limit applied when loading the reviews).

    Returns:
        A 4-tuple ``(y_train, y_test, X_train_text, X_test_text)``: the
        train and test labels exactly as returned by ``imdb.load_data``,
        followed by the train and test reviews, each as a list of
        space-joined strings.
    """
    train_split, test_split = imdb.load_data(num_words=vocavbulary)
    encoded_train, labels_train = train_split
    encoded_test, labels_test = test_split

    # Invert the word -> index vocabulary so ids can be mapped back to words.
    id_to_token = {}
    for token, token_id in imdb.get_word_index().items():
        id_to_token[token_id] = token

    def _to_text(token_ids):
        # Encoded ids are offset by 3 relative to the vocabulary (Keras'
        # default ``index_from``); any id without a vocabulary entry after
        # removing the offset is rendered as '?'.
        tokens = []
        for token_id in token_ids:
            tokens.append(id_to_token.get(token_id - 3, '?'))
        return ' '.join(tokens)

    # Turn every integer sequence back into a readable sentence.
    train_texts = list(map(_to_text, encoded_train))
    test_texts = list(map(_to_text, encoded_test))
    return labels_train, labels_test, train_texts, test_texts