dataframe take head() to list and append

what I am trying to do is taking the top 6 most relevant books from my csv of 8371 books. I did take out the top 6 books and i would like to do a for loop so i can get all my 8371 books with a list of 6 more relevant books append next to every book

def tf_similarity(s1, s2):

def add_space(s):

    return ' '.join(list(s))



s1, s2 = add_space(s1), add_space(s2)



cv = CountVectorizer(tokenizer=lambda s: s.split())

corpus = [s1, s2]

vectors = cv.fit_transform(corpus).toarray()



return np.dot(vectors[0], vectors[1]) / (norm(vectors[0]) * norm(vectors[1]))

for j in range(0,1):

for i in range(8371):

    titles.append(tf_similarity(str(document[i]), document[j]))





df = pd.DataFrame()

df["document"] = document

df["titles"] = titles

dff = df.sort_values("titles", ascending=False).head(6)

newdff=dff.values.T.tolist()

new=newdff[0]

for k in range(0,2):
boolist.append(new)

I would like my list look something like this:
book1 top1 top2 top3 top4 top5 top6
book2 top1 top2 top3 top4 top5 top6
Thank you so much for helping :)

edited Nov 25 '18 at 3:44

asked Nov 25 '18 at 0:54

Irene

Please edit your code to make it properly indented so others will read and help you. Use 4 indents into the right to make it a code. Also use Python-specific indentation within your code to make it readable.

– dmitryro
Nov 25 '18 at 0:56

add a comment |

def tf_similarity(s1, s2):

def add_space(s):

    return ' '.join(list(s))



s1, s2 = add_space(s1), add_space(s2)



cv = CountVectorizer(tokenizer=lambda s: s.split())

corpus = [s1, s2]

vectors = cv.fit_transform(corpus).toarray()



return np.dot(vectors[0], vectors[1]) / (norm(vectors[0]) * norm(vectors[1]))

for j in range(0,1):

for i in range(8371):

    titles.append(tf_similarity(str(document[i]), document[j]))





df = pd.DataFrame()

df["document"] = document

df["titles"] = titles

dff = df.sort_values("titles", ascending=False).head(6)

newdff=dff.values.T.tolist()

new=newdff[0]

for k in range(0,2):
boolist.append(new)

I would like my list look something like this:
book1 top1 top2 top3 top4 top5 top6
book2 top1 top2 top3 top4 top5 top6
Thank you so much for helping :)

edited Nov 25 '18 at 3:44

asked Nov 25 '18 at 0:54

Irene

Please edit your code to make it properly indented so others will read and help you. Use 4 indents into the right to make it a code. Also use Python-specific indentation within your code to make it readable.

– dmitryro
Nov 25 '18 at 0:56

add a comment |

def tf_similarity(s1, s2):

def add_space(s):

    return ' '.join(list(s))



s1, s2 = add_space(s1), add_space(s2)



cv = CountVectorizer(tokenizer=lambda s: s.split())

corpus = [s1, s2]

vectors = cv.fit_transform(corpus).toarray()



return np.dot(vectors[0], vectors[1]) / (norm(vectors[0]) * norm(vectors[1]))

for j in range(0,1):

for i in range(8371):

    titles.append(tf_similarity(str(document[i]), document[j]))





df = pd.DataFrame()

df["document"] = document

df["titles"] = titles

dff = df.sort_values("titles", ascending=False).head(6)

newdff=dff.values.T.tolist()

new=newdff[0]

for k in range(0,2):
boolist.append(new)

I would like my list look something like this:
book1 top1 top2 top3 top4 top5 top6
book2 top1 top2 top3 top4 top5 top6
Thank you so much for helping :)

edited Nov 25 '18 at 3:44

asked Nov 25 '18 at 0:54

Irene

def tf_similarity(s1, s2):

def add_space(s):

    return ' '.join(list(s))



s1, s2 = add_space(s1), add_space(s2)



cv = CountVectorizer(tokenizer=lambda s: s.split())

corpus = [s1, s2]

vectors = cv.fit_transform(corpus).toarray()



return np.dot(vectors[0], vectors[1]) / (norm(vectors[0]) * norm(vectors[1]))

for j in range(0,1):

for i in range(8371):

    titles.append(tf_similarity(str(document[i]), document[j]))





df = pd.DataFrame()

df["document"] = document

df["titles"] = titles

dff = df.sort_values("titles", ascending=False).head(6)

newdff=dff.values.T.tolist()

new=newdff[0]

for k in range(0,2):
boolist.append(new)

I would like my list look something like this:
book1 top1 top2 top3 top4 top5 top6
book2 top1 top2 top3 top4 top5 top6
Thank you so much for helping :)

python list dataframe tf

edited Nov 25 '18 at 3:44

asked Nov 25 '18 at 0:54

Irene

edited Nov 25 '18 at 3:44

asked Nov 25 '18 at 0:54

Irene

edited Nov 25 '18 at 3:44

asked Nov 25 '18 at 0:54

Irene

asked Nov 25 '18 at 0:54

Irene

asked Nov 25 '18 at 0:54

Irene

Please edit your code to make it properly indented so others will read and help you. Use 4 indents into the right to make it a code. Also use Python-specific indentation within your code to make it readable.

– dmitryro
Nov 25 '18 at 0:56

add a comment |

Please edit your code to make it properly indented so others will read and help you. Use 4 indents into the right to make it a code. Also use Python-specific indentation within your code to make it readable.

– dmitryro
Nov 25 '18 at 0:56

Please edit your code to make it properly indented so others will read and help you. Use 4 indents into the right to make it a code. Also use Python-specific indentation within your code to make it readable.

– dmitryro
Nov 25 '18 at 0:56

add a comment |

0

active

oldest

votes

Your Answer

StackExchange.ifUsing("editor", function () {
StackExchange.using("externalEditor", function () {
StackExchange.using("snippets", function () {
StackExchange.snippets.init();
});
});
}, "code-snippets");

StackExchange.ready(function() {
var channelOptions = {
tags: "".split(" "),
id: "1"
};
initTagRenderer("".split(" "), "".split(" "), channelOptions);

StackExchange.using("externalEditor", function() {
// Have to fire editor after snippets, if snippets enabled
if (StackExchange.settings.snippets.snippetsEnabled) {
StackExchange.using("snippets", function() {
createEditor();
});
}
else {
createEditor();
}
});

function createEditor() {
StackExchange.prepareEditor({
heartbeatType: 'answer',
autoActivateHeartbeat: false,
convertImagesToLinks: true,
noModals: true,
showLowRepImageUploadWarning: true,
reputationToPostImages: 10,
bindNavPrevention: true,
postfix: "",
imageUploader: {
brandingHtml: "Powered by u003ca class="icon-imgur-white" href="https://imgur.com/"u003eu003c/au003e",
contentPolicyHtml: "User contributions licensed under u003ca href="https://creativecommons.org/licenses/by-sa/3.0/"u003ecc by-sa 3.0 with attribution requiredu003c/au003e u003ca href="https://stackoverflow.com/legal/content-policy"u003e(content policy)u003c/au003e",
allowUrls: true
},
onDemand: true,
discardSelector: ".discard-answer"
,immediatelyShowMarkdownHelp:true
});

}
});

draft saved

draft discarded

Sign up or log in

StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

StackExchange.ready(
function () {
StackExchange.openid.initPostLogin('.new-post-login', 'https%3a%2f%2fstackoverflow.com%2fquestions%2f53463768%2fdataframe-take-head-to-list-and-append%23new-answer', 'question_page');
}
);

Post as a guest

Name

Required, but never shown

0

active

oldest

votes

0

active

oldest

votes

draft saved

draft discarded

Thanks for contributing an answer to Stack Overflow!

Please be sure to answer the question. Provide details and share your research!

But avoid …

Asking for help, clarification, or responding to other answers.

Making statements based on opinion; back them up with references or personal experience.

To learn more, see our tips on writing great answers.

draft saved

draft discarded

Sign up or log in

StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Post as a guest

Name

Required, but never shown

Sign up or log in

StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Sign up or log in

StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Sign up or log in

StackExchange.ready(function () {
StackExchange.helpers.onClickDraftSave('#login-link');
});

Post as a guest

Name

Required, but never shown

Name

Required, but never shown

Name

Required, but never shown

This page is only for reference, If you need detailed information, please check here

搜尋此網誌

Nsryjdtyk