open(FILE, "C:/Users/li/data_collection/posts/165644996453.html"); while () { if ( /(?<=

)(.*)(?=<\/p>\s+