目录
介绍
官网地址:https://github.com/facebookresearch/sam2
Segment Anything Model 2 (SAM 2) is a foundation model towards solving promptable visual segmentation in images and videos. We extend SAM to video by considering images as a video with a single frame. The model design is a simple transformer architecture with streaming memory for real-time video processing. We build a model-in-the-loop data engine, which improves model and data via user interaction, to collect our SA-V dataset, the largest video segmentation dataset to date. SAM 2 trained on our data provides strong performance across a wide range of tasks and visual domains.
效果
模型信息
sam2_hiera_small_encoder.onnx
Model Properties
-------------------------
---------------------------------------------------------------
Inputs
-------------------------
name:image
tensor:Float[1, 3, 1024, 1024]
---------------------------------------------------------------
Outputs
-------------------------
name:high_res_feats_0
tensor:Float[1, 32, 256, 256]
name:high_res_feats_1
tensor:Float[1, 64, 128, 128]
name:image_embed
tensor:Float[1, 256, 64, 64]
---------------------------------------------------------------
sam2_hiera_small_decoder.onnx
Model Properties
-------------------------
---------------------------------------------------------------
Inputs
-------------------------
name:image_embed
tensor:Float[1, 256, 64, 64]
name:high_res_feats_0
tensor:Float[1, 32, 256, 256]
name:high_res_feats_1
tensor:Float[1, 64, 128, 128]
name:point_coords
tensor:Float[-1, -1, 2]
name:point_labels
tensor:Float[-1, -1]
name:mask_input
tensor:Float[-1, 1, 256, 256]
name:has_mask_input
tensor:Float[-1]
name:orig_im_size
tensor:Int32[2]
---------------------------------------------------------------
Outputs
-------------------------
name:masks
tensor:Float[-1, -1, -1, -1]
name:iou_predictions
tensor:Float[-1, -1]
---------------------------------------------------------------
项目
代码
using OpenCvSharp;
using OpenCvSharp.Extensions;
using System;
using System.Collections.Generic;
using System.Drawing;
using System.Drawing.Imaging;
using System.Reflection;
using System.Windows.Forms;
namespace Onnx_Demo
{
public partial class Form1 : Form
{
public Form1()
{
InitializeComponent();
}
string fileFilter = "*.*|*.bmp;*.jpg;*.jpeg;*.tiff;*.tiff;*.png";
string image_path = "";
DateTime dt1 = DateTime.Now;
DateTime dt2 = DateTime.Now;
Mat image;
private void button1_Click(object sender, EventArgs e)
{
OpenFileDialog ofd = new OpenFileDialog();
ofd.Filter = fileFilter;
if (ofd.ShowDialog() != DialogResult.OK) return;
pictureBox1.Image = null;
image_path = ofd.FileName;
pictureBox1.Image = new Bitmap(image_path);
textBox1.Text = "";
image = new Mat(image_path);
pictureBox2.Image = null;
pictureBox3.Image = null;
sam.SetImage(image_path);
image = new Mat(image_path);
pictureBox1.Image = new Bitmap(image_path);
}
private void button2_Click(object sender, EventArgs e)
{
pictureBox3.Image = null;
button2.Enabled = false;
Application.DoEvents();
List
if (masks_list.Count > 0)
{
int MaxInde = 0;
float maxiou_pred = masks_list[0].iou_pred;
for (int i = 0; i < masks_list.Count; i++)
{
float temp = masks_list[i].iou_pred;
if (temp > maxiou_pred)
{
MaxInde = i;
}
}
pictureBox3.Image = BitmapConverter.ToBitmap(masks_list[MaxInde].mask);
}
button2.Enabled = true;
}
SamInferenceSession sam;
private void Form1_Load(object sender, EventArgs e)
{
string encoderPath = "model/sam2_hiera_small_encoder.onnx";
string decoderPath = "model/sam2_hiera_small_decoder.onnx";
sam = new SamInferenceSession(encoderPath, decoderPath);
sam.Initialize();
image_path = "test_img/1.jpg";
sam.SetImage(image_path);
image = new Mat(image_path);
pictureBox1.Image = new Bitmap(image_path);
}
private void pictureBox1_DoubleClick(object sender, EventArgs e)
{
Common.ShowNormalImg(pictureBox1.Image);
}
private void pictureBox2_DoubleClick(object sender, EventArgs e)
{
Common.ShowNormalImg(pictureBox2.Image);
}
SaveFileDialog sdf = new SaveFileDialog();
private void button3_Click(object sender, EventArgs e)
{
if (pictureBox2.Image == null)
{
return;
}
Bitmap output = new Bitmap(pictureBox2.Image);
sdf.Title = "保存";
sdf.Filter = "Images (*.jpg)|*.jpg|Images (*.png)|*.png|Images (*.bmp)|*.bmp|Images (*.emf)|*.emf|Images (*.exif)|*.exif|Images (*.gif)|*.gif|Images (*.ico)|*.ico|Images (*.tiff)|*.tiff|Images (*.wmf)|*.wmf";
if (sdf.ShowDialog() == DialogResult.OK)
{
switch (sdf.FilterIndex)
{
case 1:
{
output.Save(sdf.FileName, ImageFormat.Jpeg);
break;
}
case 2:
{
output.Save(sdf.FileName, ImageFormat.Png);
break;
}
case 3:
{
output.Save(sdf.FileName, ImageFormat.Bmp);
break;
}
case 4:
{
output.Save(sdf.FileName, ImageFormat.Emf);
break;
}
case 5:
{
output.Save(sdf.FileName, ImageFormat.Exif);
break;
}
case 6:
{
output.Save(sdf.FileName, ImageFormat.Gif);
break;
}
case 7:
{
output.Save(sdf.FileName, ImageFormat.Icon);
break;
}
case 8:
{
output.Save(sdf.FileName, ImageFormat.Tiff);
break;
}
case 9:
{
output.Save(sdf.FileName, ImageFormat.Wmf);
break;
}
}
MessageBox.Show("保存成功,位置:" + sdf.FileName);
}
}
bool m_mouseDown = false;
bool m_mouseMove = false;
System.Drawing.Point startPoint = new System.Drawing.Point();
System.Drawing.Point endPoint = new System.Drawing.Point();
Mat currentFrame = new Mat();
Rect roi = new Rect();
private void pictureBox1_MouseMove(object sender, MouseEventArgs e)
{
if (pictureBox1.Image == null)
return;
if (!m_mouseDown) return;
m_mouseMove = true;
endPoint = e.Location;
pictureBox1.Invalidate();
}
private void pictureBox1_Paint(object sender, PaintEventArgs e)
{
if (!m_mouseDown || !m_mouseMove)
return;
Graphics g = e.Graphics;
Pen p = new Pen(Color.Blue, 2);
Rectangle rect = new Rectangle(startPoint.X, startPoint.Y, (endPoint.X - startPoint.X), (endPoint.Y - startPoint.Y));
g.DrawRectangle(p, rect);
}
private void pictureBox1_MouseUp(object sender, MouseEventArgs e)
{
if (!m_mouseDown || !m_mouseMove)
return;
m_mouseDown = false;
m_mouseMove = false;
System.Drawing.Point image_startPoint = ConvertCooridinate(startPoint);
System.Drawing.Point image_endPoint = ConvertCooridinate(endPoint);
if (image_startPoint.X < 0)
image_startPoint.X = 0;
if (image_startPoint.Y < 0)
image_startPoint.Y = 0;
if (image_endPoint.X < 0)
image_endPoint.X = 0;
if (image_endPoint.Y < 0)
image_endPoint.Y = 0;
if (image_startPoint.X > image.Cols)
image_startPoint.X = image.Cols;
if (image_startPoint.Y > image.Rows)
image_startPoint.Y = image.Rows;
if (image_endPoint.X > image.Cols)
image_endPoint.X = image.Cols;
if (image_endPoint.Y > image.Rows)
image_endPoint.Y = image.Rows;
label1.Text = String.Format("ROI:({0},{1})-({2},{3})", image_startPoint.X, image_startPoint.Y, image_endPoint.X, image_endPoint.Y);
int w = (image_endPoint.X - image_startPoint.X);
int h = (image_endPoint.Y - image_startPoint.Y);
if (w > 10 && h > 10)
{
roi = new Rect(image_startPoint.X, image_startPoint.Y, w, h);
//Console.WriteLine(String.Format("ROI:({0},{1})-({2},{3})", image_startPoint.X, image_startPoint.Y, image_endPoint.X, image_endPoint.Y));
//test
//OpenCvSharp.Point pointinfo = new OpenCvSharp.Point(910, 641);
//roi = new Rect(pointinfo.X - 160, pointinfo.Y - 430, 380, 940);
Mat roi_mat = image[roi];
pictureBox2.Image = BitmapConverter.ToBitmap(roi_mat);
}
//pictureBox1.Invalidate();
}
private void pictureBox1_MouseDown(object sender, MouseEventArgs e)
{
if (pictureBox1.Image == null)
return;
m_mouseDown = true;
startPoint = e.Location;
}
private System.Drawing.Point ConvertCooridinate(System.Drawing.Point point)
{
System.Reflection.PropertyInfo rectangleProperty = this.pictureBox1.GetType().GetProperty("ImageRectangle", BindingFlags.Instance | BindingFlags.NonPublic);
Rectangle pictureBox = (Rectangle)rectangleProperty.GetValue(this.pictureBox1, null);
int zoomedWidth = pictureBox.Width;
int zoomedHeight = pictureBox.Height;
int imageWidth = pictureBox1.Image.Width;
int imageHeight = pictureBox1.Image.Height;
double zoomRatex = (double)(zoomedWidth) / (double)(imageWidth);
double zoomRatey = (double)(zoomedHeight) / (double)(imageHeight);
int black_left_width = (zoomedWidth == this.pictureBox1.Width) ? 0 : (this.pictureBox1.Width - zoomedWidth) / 2;
int black_top_height = (zoomedHeight == this.pictureBox1.Height) ? 0 : (this.pictureBox1.Height - zoomedHeight) / 2;
int zoomedX = point.X - black_left_width;
int zoomedY = point.Y - black_top_height;
System.Drawing.Point outPoint = new System.Drawing.Point();
outPoint.X = (int)((double)zoomedX / zoomRatex);
outPoint.Y = (int)((double)zoomedY / zoomRatey);
return outPoint;
}
}
}
- using OpenCvSharp;
- using OpenCvSharp.Extensions;
- using System;
- using System.Collections.Generic;
- using System.Drawing;
- using System.Drawing.Imaging;
- using System.Reflection;
- using System.Windows.Forms;
-
- namespace Onnx_Demo
- {
- public partial class Form1 : Form
- {
- public Form1()
- {
- InitializeComponent();
- }
-
- string fileFilter = "*.*|*.bmp;*.jpg;*.jpeg;*.tiff;*.tiff;*.png";
- string image_path = "";
- DateTime dt1 = DateTime.Now;
- DateTime dt2 = DateTime.Now;
- Mat image;
-
- private void button1_Click(object sender, EventArgs e)
- {
- OpenFileDialog ofd = new OpenFileDialog();
- ofd.Filter = fileFilter;
- if (ofd.ShowDialog() != DialogResult.OK) return;
- pictureBox1.Image = null;
- image_path = ofd.FileName;
- pictureBox1.Image = new Bitmap(image_path);
- textBox1.Text = "";
- image = new Mat(image_path);
- pictureBox2.Image = null;
- pictureBox3.Image = null;
-
- sam.SetImage(image_path);
- image = new Mat(image_path);
- pictureBox1.Image = new Bitmap(image_path);
- }
-
- private void button2_Click(object sender, EventArgs e)
- {
- pictureBox3.Image = null;
- button2.Enabled = false;
- Application.DoEvents();
- List<MatInfo> masks_list = sam.GetPointMask(roi);
- if (masks_list.Count > 0)
- {
- int MaxInde = 0;
- float maxiou_pred = masks_list[0].iou_pred;
- for (int i = 0; i < masks_list.Count; i++)
- {
- float temp = masks_list[i].iou_pred;
- if (temp > maxiou_pred)
- {
- MaxInde = i;
- }
- }
- pictureBox3.Image = BitmapConverter.ToBitmap(masks_list[MaxInde].mask);
- }
- button2.Enabled = true;
- }
-
- SamInferenceSession sam;
-
- private void Form1_Load(object sender, EventArgs e)
- {
- string encoderPath = "model/sam2_hiera_small_encoder.onnx";
- string decoderPath = "model/sam2_hiera_small_decoder.onnx";
-
- sam = new SamInferenceSession(encoderPath, decoderPath);
- sam.Initialize();
-
- image_path = "test_img/1.jpg";
-
- sam.SetImage(image_path);
- image = new Mat(image_path);
- pictureBox1.Image = new Bitmap(image_path);
-
- }
-
- private void pictureBox1_DoubleClick(object sender, EventArgs e)
- {
- Common.ShowNormalImg(pictureBox1.Image);
- }
-
- private void pictureBox2_DoubleClick(object sender, EventArgs e)
- {
- Common.ShowNormalImg(pictureBox2.Image);
- }
-
- SaveFileDialog sdf = new SaveFileDialog();
- private void button3_Click(object sender, EventArgs e)
- {
- if (pictureBox2.Image == null)
- {
- return;
- }
- Bitmap output = new Bitmap(pictureBox2.Image);
- sdf.Title = "保存";
- sdf.Filter = "Images (*.jpg)|*.jpg|Images (*.png)|*.png|Images (*.bmp)|*.bmp|Images (*.emf)|*.emf|Images (*.exif)|*.exif|Images (*.gif)|*.gif|Images (*.ico)|*.ico|Images (*.tiff)|*.tiff|Images (*.wmf)|*.wmf";
- if (sdf.ShowDialog() == DialogResult.OK)
- {
- switch (sdf.FilterIndex)
- {
- case 1:
- {
- output.Save(sdf.FileName, ImageFormat.Jpeg);
- break;
- }
- case 2:
- {
- output.Save(sdf.FileName, ImageFormat.Png);
- break;
- }
- case 3:
- {
- output.Save(sdf.FileName, ImageFormat.Bmp);
- break;
- }
- case 4:
- {
- output.Save(sdf.FileName, ImageFormat.Emf);
- break;
- }
- case 5:
- {
- output.Save(sdf.FileName, ImageFormat.Exif);
- break;
- }
- case 6:
- {
- output.Save(sdf.FileName, ImageFormat.Gif);
- break;
- }
- case 7:
- {
- output.Save(sdf.FileName, ImageFormat.Icon);
- break;
- }
-
- case 8:
- {
- output.Save(sdf.FileName, ImageFormat.Tiff);
- break;
- }
- case 9:
- {
- output.Save(sdf.FileName, ImageFormat.Wmf);
- break;
- }
- }
- MessageBox.Show("保存成功,位置:" + sdf.FileName);
- }
- }
-
- bool m_mouseDown = false;
- bool m_mouseMove = false;
-
- System.Drawing.Point startPoint = new System.Drawing.Point();
- System.Drawing.Point endPoint = new System.Drawing.Point();
-
- Mat currentFrame = new Mat();
- Rect roi = new Rect();
-
- private void pictureBox1_MouseMove(object sender, MouseEventArgs e)
- {
- if (pictureBox1.Image == null)
- return;
- if (!m_mouseDown) return;
-
- m_mouseMove = true;
- endPoint = e.Location;
-
- pictureBox1.Invalidate();
-
- }
-
- private void pictureBox1_Paint(object sender, PaintEventArgs e)
- {
- if (!m_mouseDown || !m_mouseMove)
- return;
- Graphics g = e.Graphics;
- Pen p = new Pen(Color.Blue, 2);
- Rectangle rect = new Rectangle(startPoint.X, startPoint.Y, (endPoint.X - startPoint.X), (endPoint.Y - startPoint.Y));
- g.DrawRectangle(p, rect);
- }
-
- private void pictureBox1_MouseUp(object sender, MouseEventArgs e)
- {
- if (!m_mouseDown || !m_mouseMove)
- return;
- m_mouseDown = false;
- m_mouseMove = false;
-
- System.Drawing.Point image_startPoint = ConvertCooridinate(startPoint);
- System.Drawing.Point image_endPoint = ConvertCooridinate(endPoint);
- if (image_startPoint.X < 0)
- image_startPoint.X = 0;
- if (image_startPoint.Y < 0)
- image_startPoint.Y = 0;
- if (image_endPoint.X < 0)
- image_endPoint.X = 0;
- if (image_endPoint.Y < 0)
- image_endPoint.Y = 0;
- if (image_startPoint.X > image.Cols)
- image_startPoint.X = image.Cols;
- if (image_startPoint.Y > image.Rows)
- image_startPoint.Y = image.Rows;
- if (image_endPoint.X > image.Cols)
- image_endPoint.X = image.Cols;
- if (image_endPoint.Y > image.Rows)
- image_endPoint.Y = image.Rows;
-
- label1.Text = String.Format("ROI:({0},{1})-({2},{3})", image_startPoint.X, image_startPoint.Y, image_endPoint.X, image_endPoint.Y);
- int w = (image_endPoint.X - image_startPoint.X);
- int h = (image_endPoint.Y - image_startPoint.Y);
- if (w > 10 && h > 10)
- {
- roi = new Rect(image_startPoint.X, image_startPoint.Y, w, h);
- //Console.WriteLine(String.Format("ROI:({0},{1})-({2},{3})", image_startPoint.X, image_startPoint.Y, image_endPoint.X, image_endPoint.Y));
- //test
- //OpenCvSharp.Point pointinfo = new OpenCvSharp.Point(910, 641);
- //roi = new Rect(pointinfo.X - 160, pointinfo.Y - 430, 380, 940);
- Mat roi_mat = image[roi];
- pictureBox2.Image = BitmapConverter.ToBitmap(roi_mat);
- }
- //pictureBox1.Invalidate();
-
- }
-
- private void pictureBox1_MouseDown(object sender, MouseEventArgs e)
- {
- if (pictureBox1.Image == null)
- return;
- m_mouseDown = true;
- startPoint = e.Location;
- }
-
- private System.Drawing.Point ConvertCooridinate(System.Drawing.Point point)
- {
- System.Reflection.PropertyInfo rectangleProperty = this.pictureBox1.GetType().GetProperty("ImageRectangle", BindingFlags.Instance | BindingFlags.NonPublic);
- Rectangle pictureBox = (Rectangle)rectangleProperty.GetValue(this.pictureBox1, null);
-
- int zoomedWidth = pictureBox.Width;
- int zoomedHeight = pictureBox.Height;
-
- int imageWidth = pictureBox1.Image.Width;
- int imageHeight = pictureBox1.Image.Height;
-
- double zoomRatex = (double)(zoomedWidth) / (double)(imageWidth);
- double zoomRatey = (double)(zoomedHeight) / (double)(imageHeight);
- int black_left_width = (zoomedWidth == this.pictureBox1.Width) ? 0 : (this.pictureBox1.Width - zoomedWidth) / 2;
- int black_top_height = (zoomedHeight == this.pictureBox1.Height) ? 0 : (this.pictureBox1.Height - zoomedHeight) / 2;
-
- int zoomedX = point.X - black_left_width;
- int zoomedY = point.Y - black_top_height;
-
- System.Drawing.Point outPoint = new System.Drawing.Point();
- outPoint.X = (int)((double)zoomedX / zoomRatex);
- outPoint.Y = (int)((double)zoomedY / zoomRatey);
-
- return outPoint;
- }
-
- }
- }
下载
其他


评论记录:
回复评论: