Java多线程向数据库中加载数据
读取本地文件,每行为一条记录,文件大小550MB,共200万条数据。先将文件读取到内存中,再开启6个线程分别连接PostgreSQL的不同coordinator端口导入数据。代码如下:
import java.io.BufferedReader;
import java.io.FileInputStream;
import java.io.InputStreamReader;
import java.sql.Connection;
import java.sql.DriverManager;
import java.sql.PreparedStatement;
import java.sql.SQLException;
import java.util.ArrayList;
import java.util.List;

/**
 * Bulk-loads comma-separated records into a PostgreSQL table using one worker
 * thread per coordinator port.
 *
 * <p>The input file is read fully into memory, then one {@code InsertThread}
 * is started for each entry of {@link #PORTS}. Each worker opens its own JDBC
 * connection and inserts rows with a batched {@link PreparedStatement}. The
 * workers only read the shared row list; they never modify it.
 *
 * <p>Usage: {@code java InsertThread <file> <table> <last-ip-octet>}
 */
public class InsertThread implements Runnable {

    /** Coordinator ports; one worker thread is started per port. */
    private static final String[] PORTS = { "2341", "2342", "2343", "2344", "2345", "2346" };

    /** Number of comma-separated fields a line must have to be inserted. */
    private static final int EXPECTED_COLUMNS = 38;

    /** 1-based position of the column that is cast to {@code timestamptz}. */
    private static final int TIMESTAMP_COLUMN = 7;

    /** Rows per executeBatch/commit; can be tuned (e.g. 50, 100, 500, 1000). */
    private static final int BATCH_SIZE = 10000;

    /**
     * Reads the input file and starts one loader thread per coordinator port.
     *
     * @param args {@code args[0]} input file path, {@code args[1]} target table,
     *             {@code args[2]} last octet of the {@code 192.168.8.x} host address
     */
    public static void main(String[] args) {
        if (args == null || args.length < 3) {
            System.err.println("Usage: java InsertThread <file> <table> <last-ip-octet>");
            return;
        }
        String file = args[0];
        String tb = args[1];
        String ip = args[2];

        List<String> list;
        try {
            // Load the source data.
            list = getContent(file);
        } catch (Exception e) {
            // Without data there is nothing for the workers to do.
            e.printStackTrace();
            return;
        }
        System.out.println(list.size());

        // NOTE(review): every worker is handed the complete list, so each row is
        // inserted once per port. Confirm this is intended (e.g. as a throughput
        // benchmark); otherwise give each worker a disjoint subList.
        Thread[] workers = new Thread[PORTS.length];
        for (int i = 0; i < PORTS.length; i++) {
            InsertThread task = new InsertThread();
            task.setPramater(tb, ip, PORTS[i], list);
            workers[i] = new Thread(task);
        }
        for (int i = 0; i < workers.length; i++) {
            workers[i].start();
        }
    }

    private String tb;
    private String ip;
    private String port;
    private List<String> list;

    /**
     * Configures this worker before it is started.
     *
     * @param tb   target table name (concatenated into the SQL text, so it must be trusted)
     * @param ip   last octet of the {@code 192.168.8.x} host address
     * @param port coordinator port to connect to
     * @param list rows to insert, one comma-separated record per element
     */
    public void setPramater(String tb, String ip, String port, List<String> list) {
        this.tb = tb;
        this.ip = ip;
        this.port = port;
        this.list = list;
    }

    /**
     * Connects to the configured coordinator and inserts every well-formed row.
     * Returns without touching the database when there are no rows, and stops
     * (after logging) when the driver or the connection is unavailable.
     */
    public void run() {
        if (list == null || list.isEmpty()) {
            System.err.println("No rows to insert for port " + port);
            return;
        }

        Connection conn = null;
        PreparedStatement ps = null;
        try {
            Class.forName("org.postgresql.Driver");
            String url = "jdbc:postgresql://192.168.8." + ip + ":" + port + "/postgres";
            conn = DriverManager.getConnection(url, "postgres", "postgres");
            conn.setAutoCommit(false);
            ps = conn.prepareStatement(buildInsertSql(tb));
            insertRows(conn, ps);
        } catch (ClassNotFoundException e) {
            e.printStackTrace();
        } catch (SQLException e) {
            e.printStackTrace();
        } finally {
            // Always release JDBC resources, including on the failure paths.
            if (ps != null) {
                try {
                    ps.close();
                } catch (SQLException e) {
                    e.printStackTrace();
                }
            }
            if (conn != null) {
                try {
                    conn.close();
                } catch (SQLException e) {
                    e.printStackTrace();
                }
            }
        }
    }

    /**
     * Binds and batches every row with exactly {@link #EXPECTED_COLUMNS} fields,
     * committing every {@link #BATCH_SIZE} rows, then prints throughput figures.
     */
    private void insertRows(Connection conn, PreparedStatement ps) {
        int count = 0;
        long beginTime = System.currentTimeMillis();
        long begin = beginTime;

        for (String row : list) {
            if (row == null) {
                continue;
            }
            // Limit -1 keeps trailing empty fields so the column count is exact.
            String[] con = row.split(",", -1);
            if (con.length != EXPECTED_COLUMNS) {
                continue;
            }
            count++;

            try {
                for (int j = 0; j < con.length; j++) {
                    ps.setString(j + 1, con[j].trim());
                }
                ps.addBatch();
            } catch (SQLException e) {
                // Only this row is lost; rows already batched stay queued.
                e.printStackTrace();
            }

            if (count % BATCH_SIZE == 0 && flushBatch(conn, ps)) {
                long midTime = System.currentTimeMillis();
                System.out.println("-----------------" + count);
                System.out.println("导入1万条数据性能" + rowsPerSecond(BATCH_SIZE, midTime - begin));
                begin = midTime;
            }
        }

        // Flush whatever is left over from the last partial batch.
        flushBatch(conn, ps);

        long endTime = System.currentTimeMillis();
        System.out.println("pst+batch:" + count + "条");
        System.out.println("pst+batch:" + (endTime - beginTime) / 1000 + "秒");
        System.out.println("pst+batch:" + rowsPerSecond(count, endTime - beginTime) + "条/秒");
    }

    /**
     * Executes and commits the pending batch. On failure the batch is discarded
     * and the transaction rolled back so that later batches can still succeed.
     *
     * @return {@code true} if the batch was committed
     */
    private static boolean flushBatch(Connection conn, PreparedStatement ps) {
        try {
            ps.executeBatch();
            conn.commit();
            ps.clearBatch();
            return true;
        } catch (SQLException e) {
            e.printStackTrace();
            try {
                ps.clearBatch();
            } catch (SQLException clearFailure) {
                clearFailure.printStackTrace();
            }
            try {
                // PostgreSQL rejects further statements until the failed
                // transaction has been rolled back.
                conn.rollback();
            } catch (SQLException rollbackFailure) {
                rollbackFailure.printStackTrace();
            }
            return false;
        }
    }

    /**
     * Builds the parameterised insert statement with {@link #EXPECTED_COLUMNS}
     * placeholders, casting column {@link #TIMESTAMP_COLUMN} to {@code timestamptz}.
     *
     * @param table target table name; inserted verbatim, so it must come from a trusted source
     * @return the SQL text
     */
    static String buildInsertSql(String table) {
        StringBuilder sql = new StringBuilder("insert into ").append(table).append(" values(");
        for (int i = 1; i <= EXPECTED_COLUMNS; i++) {
            if (i > 1) {
                sql.append(',');
            }
            sql.append('?');
            if (i == TIMESTAMP_COLUMN) {
                sql.append("::timestamptz");
            }
        }
        return sql.append(')').toString();
    }

    /**
     * Computes throughput in rows per second using 64-bit arithmetic.
     *
     * @param rows          number of rows processed
     * @param elapsedMillis elapsed wall-clock time; values below 1 ms are treated as 1 ms
     *                      so the division can never fail
     * @return rows per second, rounded down
     */
    static long rowsPerSecond(long rows, long elapsedMillis) {
        return rows * 1000L / Math.max(1L, elapsedMillis);
    }

    /**
     * Reads a UTF-8 text file into memory.
     *
     * @param file path of the file to read
     * @return all lines of the file in order, without line terminators
     * @throws Exception if the file cannot be opened or read
     */
    public static List<String> getContent(String file) throws Exception {
        FileInputStream in = new FileInputStream(file);
        try {
            BufferedReader br = new BufferedReader(new InputStreamReader(in, "UTF-8"));
            List<String> list = new ArrayList<String>();
            String line;
            while ((line = br.readLine()) != null) {
                list.add(line);
            }
            return list;
        } finally {
            // Closing the underlying stream releases the file handle even if reading fails.
            in.close();
        }
    }
}
【推荐】国内首个AI IDE,深度理解中文开发场景,立即下载体验Trae
【推荐】编程新体验,更懂你的AI,立即体验豆包MarsCode编程助手
【推荐】抖音旗下AI助手豆包,你的智能百科全书,全免费不限次数
【推荐】轻量又高性能的 SSH 工具 IShell:AI 加持,快人一步
· 如何编写易于单元测试的代码
· 10年+ .NET Coder 心语,封装的思维:从隐藏、稳定开始理解其本质意义
· .NET Core 中如何实现缓存的预热?
· 从 HTTP 原因短语缺失研究 HTTP/2 和 HTTP/3 的设计差异
· AI与.NET技术实操系列:向量存储与相似性搜索在 .NET 中的实现
· 周边上新:园子的第一款马克杯温暖上架
· Open-Sora 2.0 重磅开源!
· 分享 3 个 .NET 开源的文件压缩处理库,助力快速实现文件压缩解压功能!
· Ollama——大语言模型本地部署的极速利器
· DeepSeek如何颠覆传统软件测试?测试工程师会被淘汰吗?